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□ specifier=address+( size/2) +( width /2) 
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| depth = 4 bytes 



width = 16 bytes]— J\ |s/> * = depth x width = 64 W» \ 




address is aligned to size (64 bytes), 
so low-order 6 bits are zero 



address \ aaaaaaaaaaaaaaaaaaaaaaoaaaaaaaaag aaaa \ OOOOQQ\ 
size/2 I OOOOOOOOOOOOOOOOOOOOOOOOOOOOOOOQo \ WOOOO] 



width/2 \OOOOO0OO0OOO0OOO0OOO00000O00OO0OQ 



specifier 
500 



aaaaaaaaaaaaaaaaoaaaaaaaaaaaaaaaaaaaa I 101000 I 
^ ' ^ 1 

505 



FIG. 5 



510 



600 



specifier \ aaaaaaaaaaaaaaaoaaaaaaaaaaa aaaaaa aaaa \ jqjqqq \/~ 

- ^ — =L 

g/5 ^ H Tand (0-s) | 



610 



605 



width/2 \ OOOOOOOOOOOOOOOOOOOOOOOOOOOOOOOOQ \ q oiqOO I 

620 625^ \ s and not (width /2)\ 



t | ooaaaaoooaoaaoaaooaoaoaaoaooooaaoaooQ WOOOO [ 
s/ze/? | OOOOOOOOOOOOOOOOOOOOOOOOOO OOOOQOO 1 100000 \ 

^ ' — I ' J 

640 645 ^ t and not (siz e/2) \ 

address \ aaaaaaaaaaaaaaaaaaaaoaaaaaaaa aaaaaaaa \ OOOOOO] 

650 



FIG. 6 
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Register operand 
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Owmc.c contents 



□ wmc.pa- physical address 
Owmc. size- size of contents 
Qwmc.cv- con tents valid 
Qwmc.th- thread last used 

□ wmc.reg-register last used 
Owmc.rtv-register & thread valid 
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local virtual address 



local virtual 
to global 
virtual 
address 

translation 



giooai virtual address 



global 
virtual to 
physical 
address 
translation 



physical address 



address 



cache data 



address cache tag 



memory management organization 
Fig. 14 
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protection 

global 
"protection 
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'protection 



63 
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40 
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def data v flags <- AccessPhysicalLTB(pa,op,wdata) as 

th*-pa23..l9 
en <- pafr.4 

if (en < (1 || 0 LE )) and (th < T) and (pa 18 ..6=0) then 
case op of 
R: 

data <- 0 64 || LTBArray[th][en] 

W: 

LocalTBlui][en] <- wdata63..o 

endcase 

else 

data <- 0 

end'if 
enddef 

Fig. 16 
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Fig. 20 
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d f ga.LocalProtect LocalTranslation(th,ba,la,pl) as 
if LB & (ba63..48 © Ia63..48) then 

raise AccessDisallowedByVirtualAddr ss 

end if 

me <- NONE 
fori<-0to (1 || 0 LE H 

if (Iae3..48 & -LocalTB[th][0 6 3..48) = LocalTB[th][i]47..32 then 
me<-i 

endif 
endfor 

if me = NONE then 

if -Control Registerpj+e then 
raise LocalTBMiss 

endif 
ga <- la 

Local Protect +- 0 

else 

ga <- (V363..48 A LocalTB[th][me] 31 .. 16 ) II va4 7 ..o 
LocalProtect <- LocalTB[th][me]i5..o 

endif 
enddef 

Fig. 22 
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Fig. 23 



def data,flags <- AccessPhysicalGTB(pa,op,wdata) as 
th <r- pa 2 3..i9+GT II 0 GT 
en4-pa] 8 ..4 

if (en < (1 1| 0 G )) and (th < T) and (pa 18 +GT..i9 = 0) then 
case op of 
R: 

data <- GTBArray[th 5 ..GT][en] 

W: 

GTBArray[th5..GT][en] <- wdata 

endcase 

else 

data 0 

endif 

enddef 

Fig. 24 
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Fig. 25 



def pa.GlobalProtect <- GlobalAddressTranslation(th f ga f pl,lda) as 
me <- NONE 
fori<-0to(1 ||0 G )-1 

if GlobalTB[th5..GT][>] * 0 then 

size <- (GlobalTB[th 5 ..GT]Pl63..7 and (O^-GlobarrBfth^GTlPte.^)) II 0 8 
if <(ga63..8l|0 8 ) A (GlobalTBtth 5 .. G T][il63..8l|0 8 )) and (O^-size)) = 0 then 
me <- GlobalTB[th5..GT]tO 

endif 

endif 
endfor 

if me = NONE then 
if Ida then 

PerformAccessDetail(AccessDetailRequiredByLocalTB) 

endif 

raise GlobalTBMiss 

else 

pa <- (ga 6 3..8 A C3lobalTB[th 5 ..GT][me]i27..T2) II 937..0 

GlobalProtect <- GlobalTB[th5..GT][me]71..64 II 0 1 II GlobalTB[th5..GTl[^e]6..0 

endif 
enddef 

Fig. 26 



def GTBUpdateWrite(th,fill,data) as 
me <- NONE 
fori«-0to(1 || 0 G )-1 

siz <- (GlobalTB[th 5 ..GT][i]63..7 and (0 64 -GlobalTB(th 5 ..GT][063..7)) II 0 8 
if ((data 63 .. 8 ||0 8 ) A (GlobalTB[th 5 .. G T][063..8l|O 8 )) and (O^-size) = 0 then 
me<-i 

endif 
endfor 

if me = NONE then 
if fill then 

GlobalTB[th 5 ..GT][GTBLast[th 5 ..GT]] <- data 
GTBLast[th 5 .. G T] «- (GTBLast[th 5 .. G T] + 1)g-1..0 
if GTBLast[th 5 ..GT] - 0 then 

GTBLast[th 5 ..GTl «- GTBFirst[th5..GTl 

GTBBump[th5..GT] «- 1 

endif 

endif 

else 

GlobalTB[th5..GT][me] <- data 

endif 
enddef 

Fig. 27 
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def data.fiags <- AccessPhysicalGTBR gisters(pa,op,wdata) as 
th <- pa23..19+GT II 0 GT 
rn <- paia..8 

if (rn < 5) and (th < T) and (paie+GT..19 = 0) and (pa 7 .. 4 = 0) then 
case m || op of 
0 1| R, 1 || R: 

data 4-0 
0 1| W, 1 || W: 

GTBUpdateWrite(th,rno,wdata) 

2 1| R: 

data O 64 " 0 || GTBLast[th 5 „GT] 
2||W: 

GTBLast[th5..GTl «- wdataG-i..o 
3 II R: 

data <- O 64 ' 6 || GTBFirst[th 5 ..GT] 
3||W: 

GTBFirst[th5..GTl <- w dataG-i..o 
3||R: 

data <- 0 63 1| GTBBump[th5..GT] 
3||W: 

GTBBump[th5..GTl «- wdatao 

endcase 

else 

data <- 0 

endif 
enddef 



Fig. 30 



I G.BOOLEAN I Group Boolean 



Equivalencies 



G.AAA 


Group three-way and 


G.AAA.1 


Group add add add bits 


G.AAS.1 


Group add add subtract bits 


G.ADD.1 


Group add bits 


G.AND 


Group and 


G.ANDN 


Group and not 


G.COPY 


Group copy 


G.NAAA 


Group three-way nand 


G.NAND 


Group nand 


G.NOOO 


Group three-way nor 


G.NOR 


Group nor 


G.NOT 


Group not 


G.NXXX 


Group three-way exclusive-nor 


G.000 


Group three-way or 


G.OR 


Group or 


G.ORN 


Group or not 


G.SAA.1 


Group subtract add add bits 


G.SAS.1 


Group subtract add subtract bits 


G.SET 


Group set 


G.SET.AND.E.1 


Group set and equal zero bits 


G.SET.AND.NE.1 


Group set and not equal zero bits 


G.SET.E.1 


Group set equal bits ! 


G.SET.G.1 


Group set greater signed bits 


G.SET.G.U.1 


Group set greater unsigned bits 


G.SET.G.Z.1 


Group set greater zero signed bits 


G.SET.GE.1 


Group set greater equal signed bits 


G.SET.GE.Z.1 


Group set greater equal zero signed bits 


G.SET. LI 


Group set less signed bits 


G.SET.LZ.1 


Group set less zero signed bits 


G.SET.LE.1 


Group set less equal signed bits 


G.SET.LE.U.1 


Group set less equal unsigned bits 


G.SET.LE.Z.1 


Group set less equal zero signed bits 


G.SET.NE.1 


Group set not equal bits 


G.SET.GE.U.1 


Group set greater e jual unsigned bits 


G.SET.L.U.1 


Group set less unsigned bits 



Fig. 31A 



G.SSA.1 


Group subtract subtract add bits 


G.SSS.1 


Group subtract subtract subtract bits 


G.SUB.1 


Group subtract bits 


G.XNOR 


Group exclusive-nor 


G.XOR 


Group exclusive-or 


G.XXX 


Group three-way exclusive-or 


G.ZERO 


Group zero 




G.AAA rd@rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b10000000 


G.AAA.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.AAS.1 rd@rc,rb 


—> 


G.XXX rd@rc,rb | 


G.ADD.1 rd=rc,rb 


— > 


G.XOR rd=rc,rb 


G.AND rd=rc,rb 


<— 


G.BOOLEAN rd@rc,rb.0b1 0001 000 


G.ANDN rd=rc,rb 


«— 


G.BOOLEAN rd@rc,rb,0b01000100 


G.BOOLEAN rd@rb,rc,i 


-> 


G.BOOLEAN rd@rc,rb,i7i5ifii4i3ii i2'0 


G.COPYrd=rc 


<- 


G.BOOLEAN rd@rc,rc,0b1 0001 000 


G.NAAA. rd@rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b01 111111 


G.NAND rd-rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b01 1 101 1 1 


G.NOOO rd@rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b00000001 


G.NOR rd=rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b00010001 


G.NOTrd=rc 


4- 


G.BOOLEAN rd@rc,rc,0b00010001 


G.NXXX rd@rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b01 101001 


G.000 rd@rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b1 1111110 


G.ORrd=rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b1 1 1 01 1 1 0 


G.ORN rd=rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b1 101 1101 


G.SAA.1 rd@rc,rb 


-> 


G.XXX rd@rc.rb 


G.SAS.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SETrd 


<— 


G.BOOLEAN rd@rd,rd,0b10000001 


G.SET.AND.E.1 rd=rb,rc -> 


G.NAND rd=rc,rb 


G.SET.AND.NE.1 rd-rb,rc -» 


G.AND rd=rc,rb 


G.SET.E.1 rd=rb,rc 


-> 


G.XNOR rd=rc,rb 


G.SET.G.1 rd=rb,rc 


-> 


G.ANDN rd=rc,rb 


G.SET.G.U.1 rd=rb,rc 


-> 


G.ANDN rd=rb,rc 


G.SET. G.Z. 1 rd=rc 


-> 


G.ZERO rd 


G.SET.GE.1 rd-rb,rc 


-> 


G.ORN rd=rc,rb 


G. SET. GE. Z. 1 rd=rc 


-> 


G.NOT rd=rc 



Fig. 31 A (cont'd) 



G.SET.L1 rd=rb,rc 


-> 


G.ANDN rd=rb.rc 


G.SET.LZ.1 rd=rc 


— > 


G.COPY rd=rc 


G.SET.LE.1 rd=rb,rc 


— > 


G.ORN rd=rb,rc 


G.SET.LE.U.1 rd=rb,rc 


-> 


G.ORN rd=rc,rb 


G.SET.LE.Z.1 rd=rc 


-> 


G.SET rd 


G.SET.NE.1 rd=rb,rc 


-» 


G.XOR rd=rc,rb 


G. SET. GE. U. 1 rd-rb,rc 


-> 


G.ORN rd=rb,rc 


G.SET.L.U.1 rd-rb,rc 


-> 


G.ANDN rd=rc,rb 


G.SSA.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SSS.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SUB.1 rd=rc,rb 


-> 


G.XOR rd=rc,rb 


G.XNOR rd=rc,rb 


<— 


G. BOOLEAN rd@rc,rb,0b1 001 1001 


G.XOR rd-rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b01100110 


G.XXXrd@rc.rb 


<— 


G.BOOLEAN rd@rc,rb,0b10010110 


G.ZERO rd 




G.BOOLEAN rd@rd,rd,0b00000000 



Selection 



operation 


function (binary) 


function (decimal) 


d 


11110000 


240 


c 


11001100 


204 | 


b 


10101010 


176 


d&c&b 


10000000 


128 


(d&c)|b 


11101010 


234 


dlclb 


11111110 


254 


d?c:b 


11001010 


202 


d^ 


10010110 


150 | 


~d A c A b 


01101001 


105 


0 


00000000 


0 



Fig. 31 A (cont'd) 



Format 

G.BOOLEANrd@trc,trb,f 
rd=gbooleani(rd,rc,rb,f) 

31 252423 18 17 12 11 65 0 

| (Tboolean |jh| rd | rc | rb | il | 

7 1 6 6 6 6 

if f6=f5 then 

iff2=fithen 
if f2 then 

rc <- max(trc,trb) 
rb <- min(trc.trb) 

else 

rc <- min(trc.trb) 
rb <- max(trc,trb) 

endif 
ih<-0 

il^0||f6||f7||f4l|f3l|f0 

else 

if f2 then 

rc«-trb 
rb<-trc 

else 

rc <r- trc 
rb«-trb 

endif 
ih<-0 

il<-1||f6l|f7l|f4l|f3l|f0. 

endif 

else 

ih«-1 
if f6 then 

rc <- trb 
rb<-trc 

il<-fll|f2l|f7l|f4||f3l|f0 

else 

rc <- trc 
rb<-trb 

il*-f2l|fll|f7l|f4l|f3l|fo 

endif 

endif 



Definition 

def GroupBoolean (ih,rd t rc t rb f il) 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
if ih=0 then 

if il5=0 then 

f*-«3 II »4 II «4 II "2 II »1 II (rorb)* || il 0 

else 

f <- n 3 1| iu || iW II fell ni no || 1 ||n 0 

endif 

else 

f<-il3l|0||1||ir 2 ||ili||il5l|il4l|Ho 

endif 

fori<-0to 127 by size 

ai^f(di||c ( ||bi) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

none 



Fig. 31C 



Operation codes 



IG.MUX 


Group multiplex 


1 


Redundanci s 


G.MUX ra=rd,rc,rc 


<=> 


G.COPYra-rc 


G.MUX ra=ra f rc,rb 


o 


G.BOOLEAN ra@rc,rb,0x1 1001010 | 


G.MUX ra=rd,ra,rb 


<=> 


G.BOOLEAN ra@rd,rb,0x1 1 1 0001 0 | 


G.MUX ra=rd,rc,ra 


o 


G.BOOLEAN ra@rd,rc,0x1 101 1000 


G.MUX ra=rd,rd,rb 


o 


G.OR ra=rd,rb 


G.MUX ra=rd,rc,rd 


o 


G.AND ra=rd,rc 



Format 



G.MUX ra=rd,rc,rb 
ra=gmux(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

I" G.MUX | rd | re I rb | ra I 

8 6 6 6 6 

Fig. 31D 



Definition 

def GroupTernaryfop.size.rd.rc.rt^ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 
G.MUX: 

a <- (c and d) or (b and not d) 

endcase 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 

Fig. 31D 



c* Ann ft 


Groun add bvtes 


Ann ir 


Groun add doublets 


Ann ^9 


Groun add ouadlets 


c> Ann R4 


Groun add octlets 


ft Ann 19ft 


Groun add hexlet 


ft Ann i ft 


Groun add limit tinned bvtps 

vlwU^ OUU III 1 Hi Oiyi icvj IvO 


ft Ann i ir 

O.nUU.L. ID 


ftroun add limit ^ionpd dnuhlpta 
v?iuup auu hi tin oiyi ic?u vjuuuiuvo 


Ann i ^9 


Groun add limit tinned nuadlpfc 

wlUUU QuU III llll Oiyi IwU VjUaUICld 


ri Ann I ra 


ftrnim add limit cinnpd optlptc 

V?IUU}J dVJVJ III llll Oiyi IC7U vVilClO 


ft Ann i 19ft 

O.nUU.L I^O 


Groi in add limit ^ionpd hpylpt 

\Jl WUp CIvJVJ III llll Oiyi IwU 1 IvAICl 


o Ann i lift 

U.MUU.LU.O 


ftrni in add limit i mQinnpd bx/tPQ 

VJI vU^ avJVJ III llll Ul 191^1 IvU uyico 


Ann I 1 1 1ft 

U.MUU.LU. ID 


ftroun add limit unQinnpd dnuhlptQ 

Vj 1 \JLI|J ClUu III llll UllOiyilOU UvUUIClO 


ft Ann i 1 1 ^9 


Groun add limit unpinned nuadlpte 

VI vtip OUU III llll Ul IvIVJI IvVJ UUQUIwlO 


Ann i 1 1 


Groun add limit unpinned ortlpte 

\*s 1 OUU III llll Ul lOiy 1 IwU V/vllwlO 


ft Ann i 1 1 19ft 


ftroun add limit unQionpd hpylpt 

\Jl vvip aUU III llll Ul lOiyi IwU 1 ICAIvl 


ft Ann ft n 


ftrnun add Qionpd hx/tPQ phpnlc ovprflow 
vji \J\J\J auu oiy i iwu uy iwo uiivuv uvci t iuw 


ft Ann 1ft n 


ft rot in add ^ionpd dnublpfc phpnk ovprflow 
viuuu auu oiy i icu uuuuicio uiiwUfx uvci iikjvj 


ft Ann ^9 n 


ftrmm Add cinnpd niiadlptc phpeW nvprflouv 
viuuu auu oiy i icu vjuauiwio uiiouiv uvciiivw 


Ann ftA o 


ft mi in sadH cinnoH o^tlotc rhorlf nvo rfl r\\Ai 
oiuuu auu oiyiicu Uwiicio viit7Ui\ uvci i iuw 


G ADD 128 O 

\J ./\L«/ L-/ . 1 £.U»Vy 


GrouD add sianed hexlet check overflow 


G.ADD.U.8.0 


Group add unsigned bytes check overflow 


G.ADD.U.16.0 


Group add unsigned doublets check overflow 


G.ADD.U.32.0 


Group add unsigned quadlets check overflow 


G.ADD.U.64.0 


Group add unsigned octlets check overflow 


G.ADD.U.128.0 


Group add unsigned hexlet check overflow 



Fig. 32A 



Format 



G.op.size rd=rc,rb 
rd=gopsize(rc,rb) 

31 24 23 18 17 12 11 6 5 0 

| G.size | rd | rc | rb | op | 

8 6 6 6 6 



Fig. 32B 



D finition 



def Groupfop.size.rd.rc.rb) 
c«- RegRead(rc, 128) 
b <r- RegRead(rb, 128) 
case op of 
G.ADD: 

for i <- 0 to 1 28-size by size 

ai+size-1..i «- Ci+size-1..i + t>i+size-1..i 
endfor 
G.ADD.L: 

for i 4- 0 to 1 28-size by size 

1 «- (q+size-1 II Cj+size-l.j) + (&i+size-1 II bi+size-1..i) 

ai+size-1..i <~ Osize * *size-l) ? (t S fee II t||&1) : *size-1..0 
endfor 
G.ADD.LU: 

for i <- 0 to 1 28-size by size 

t <- (0 1 || c l+siz e-i..i) + (0 1 || bj+sfee-u) 

aj+size-1..i *- (tsize * 0) ? (1 slze ) : t S ize-1..0 
endfor 
GADD.O: 

for i <- 0 to 1 28-size by size 

t *- (Ci+size-1 II C|+size-1..i) + (&i+size-1 II &i+size-1..i) 
if tsize * t S | ze -i then 

raise FixedPointArithmetic 

endif 

ai+size-1..i<-tsize-1..0 
endfor 
G.ADD.U.O: 

for i <- 0 to 1 28-size by size 

t <- (0 1 || q+size-1 ..i) + (0 1 || bj+ S ize-1..i) 

if tsize * 0 then 

raise FixedPointArithmetic 

endif 

ai+size-1..i<- t size-1..0 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 32C 



Operation codes 



G.SET.AND.E.8 1 


Group set and equal zero bytes 


G.SET.AND.E.16 


Group set and equal zero doublets 


G.SET.AND.E.32 


Group set and equal zero quadlets 


G.SET.AND.E.64 


Group set and equal zero octlets 


G.SET.AND.E.128 


Group set and equal zero hexlet 


G.SET.AND.NE.8 


Group set and not equal zero bytes 


G.SET.AND.NE.16 


Group set and not equal zero doublets 


G.SET.AND.NE.32 


Group set and not equal zero quadlets 


G.SET.AND.NE.64 


Group set and not equal zero octlets 


G.SET.AND.NE. 1 28 


Group set and not equal zero hexlet 


G.SET.E.8 


Group set equal bytes 


G.SET.E.16 


Group set equal doublets 


G.SET.E.32 


Group set equal quadlets 


G.SET.E.64 


Group set equal octlets 


G.SET.E.128 


Group set equal hexlet 


G.SET.GE.8 


Group set greater equal signed bytes 


G.SET.GE.16 


Group set greater equal signed doublets 


G.SET.GE.32 


Group set greater equal signed quadlets 


G.SET.GE.64 


Group set greater equal signed octlets 


G.SET.GE.128 


Group set greater equal signed hexlet 


G.SET.GE.U.8 


Group set greater equal unsigned bytes 


G.SET.GE.U.16 


Group set greater equal unsigned doublets 


G.SET.GE.U.32 


Group set greater equal unsigned quadlets 


G.SET.GE.U.64 


Group set greater equal unsigned octlets 


G.SET.GE.U.128 


Group set greater equal unsigned hexlet 


G.SET.L.8 


Group set signed less bytes 


G.SET.L.16 


Group set signed less doublets 


G.SET.L.32 


Group set signed less quadlets 


G.SET.L.64 


Group set signed less octlets 


G.SET.L.128 


Group set signed less hexlet 


G.SET.L.U.8 


Group set less unsigned bytes 


G.SET.LU.16 


Group set less unsigned doublets 


G.SET.L.U.32 


Group set less unsigned quadlets ! 


G.SET.L.U.64 


Group set less unsigned octlets 


G.SET.L.U.128 


Group set less unsigned hexlet | 


G.SET.NE.8 


Group set not equal bytes 


G.SET.NE.16 


Group set not equal doublets 



Fig. 33A 



G.SET.NE.32 


Group set not equal quadlets 


G.SET.NE.64 


Group set not equal octlets 


G.SET.NE.128 


Group set not equal hexlet 


G.SUB.8 


Group subtract bytes 


G.SUB.8.0 


Group subtract signed bytes check overflow ! 


G.SUB.16 


Group subtract doublets 


G.SUB.16.0 


Group subtract signed doublets check overflow 


G.SUB.32 


i * _ ft • | ft 

Group subtract quadlets 


G.SUB.32.0 


Group subtract signed quadlets check overflow 


G.SUB.64 


Group subtract octlets 


G.SUB.64.0 


Group subtract signed octlets check overflow 


G.SUB.128 


Group subtract hexlet 


G.SUB.128.0 


Group subtract signed hexlet check overflow 


G.SUB.L.8 


Group subtract limit signed bytes 


G.SUB.L16 


ft ■ A *9 * ft ft ft t * 

Group subtract limit signed doublets 


G.SUB.L32 


Group subtract limit signed quadlets 


G.SUB.L.64 


Group subtract limit signed octlets 


G.SUB.L128 


Group subtract limit signed hexlet 


G.SUB.L.U.8 


Group subtract limit unsigned bytes 


G.SUB.L.U.16 


Group subtract limit unsigned doublets 


G.SUB.L.U.32 


Group subtract limit unsigned quadlets 


G.SUB.LU.64 


Group subtract limit unsigned octlets 


G.SUB.LU.128 


Group subtract limit unsigned hexlet 


G.SUB.U.8.0 


Group subtract unsigned bytes check overflow 


G.SUB.U.16.0 


Group subtract unsigned doublets check overflow 


G.SUB.U.32.0 


Group subtract unsigned quadlets check overflow 


G.SUB.U.64.0 


Group subtract unsigned octlets check overflow 


G.SUB.U.128.0 


Group subtract unsigned hexlet check overflow ; 



Fig. 33A (cont'd) 



Equivalencies 



G SET.E.Z.8 


Group set equal zero bytes 


G.SET.E.Z.16 


Group set equal zero doublets 


G.SET.E.Z.32 


Group set equal zero quadlets 


G.SET.E.Z.64 


Group set equal zero octlets 


G.SET.E.Z.128 


Group set equal zero hexlet 


G.SET.G.Z.8 


Group set greater zero signed bytes 


G.SET.G.Z.16 


Group set greater zero signed doublets 


G.SET.G.Z.32 


Group set greater zero signed quadlets 


G.SET.G.Z.64 


Group set greater zero signed octlets 


G.SET.G.Z.128 


Group set greater zero signed hexlet 


G SET.GE.Z.8 


Group set greater equal zero signed bytes 


G SET.GE.Z.16 


Group set greater equal zero signed doublets 


G SET.GE.Z.32 


Group set greater equal zero signed quadlets 


G SET.GE.Z.64 


Group set greater equal zero signed octlets 


GSET GEZ.128 


Group set greater equal zero signed hexlet 


GSETLZ 8 


Group set less zero signed bytes 


GSETLZ 16 


Group set less zero signed doublets 


GSETLZ 32 


Group set less zero signed quadlets 


G SETLZ 64 


Group set less zero signed octlets 


G SETL Z 728 


Group set less zero signed hexlet 


G SET.LE.Z.8 


Group set less equal zero signed bytes 


G SET.LE.Z.16 


Group set less equal zero signed doublets 


G SETLEZ32 


Group set less equal zero signed quadlets | 


G SETLEZ64 


Group set less equal zero signed octlets 


G.SET.LE.Z128 


Group set less equal zero signed hexlet 


G.SET.NE.Z.8 


Group set not equal zero bytes 


G.SET.NE.Z.16 


Group set not equal zero doublets 


G.SET.NE.Z.32 


Group set not equal zero quadlets 


G.SET.NE.Z.64 


Group set not equal zero octlets 


G.SET.NE.Z.128 


Group set not equal zero hexlet 



Fig. 33A (cont'd) 



O OCT / C P 


GrouD set less eaual sianed bytes 


O CCT 1 F ifi 
b.ot I.Lt. 7 0 


GrouD set less eaual siqned doublets 


b.ot / .Lc.JZ 


Group set less equal signed quadlets 


O OCT 1 F fid 


Group set less equal signed octlets 


OCT 1 F 17R 


Group set less equal signed hexlet 


H QPT 1 F 11 R 


Group set less equal unsigned bytes 


n QPT 1 F II 1ft 
b. OC 1 . LC U. iO 


Group set less equal unsigned doublets 


b.OC / .LL.U.04 


Group set less equal unsigned quadlets 


O CCT I F II fid 


Group set less equal unsigned octlets 


1^ QPT 1 F 1 1 19R 
b.ot / .Lt.U. f^O 


Group set less equal unsigned hexlet 


b.ot / . b.o 


GrouD set sianed areater bytes 


CCT /2 -f P 

b.ot / .b.70 


Grnun set sianed areater doublets 


O CCT O 
b.ot 1 


GrouD set sianed areater auadlets 


fl CCT ^ P/< 

b.ot / .b.0*f 


Grouo set sianed areater octlets 


O CCT O 4 OP 
b.ot / .b. 7ZO 


QrniiD set sianed areater hexlet 


/•> cct n 1 1 n 
b.ot / .b.u.o 


Grouo set areater unsianed bvtes 

V^l w*Jiy WW* WtWWl*W. HI IWIM' IW w ¥ »ww 


G.SET.G.U.16 


Group set greater unsigned doublets 


G.SET.G.U.32 


Group set greater unsigned quadlets 


G.SET.G.U.64 


Group set greater unsigned octlets 


G.SET.G.U.128 


Group set greater unsigned hexlet 



G.SET.E.Z.size rd=rc 


ir- 


G.SET.AND.E.size rd=rc,rc j 


G.SET.G.Zsize rd=rc 


<=■ 


G.SET.L.U.size rd=rc,rc 


G.SET.GE.Z.size rd=rc 


<= 


G.SET.GE.size rd=rc,rc 


G.SET.LZ.size rd-rc 


<= 


G.SET.L.size rd=rc,rc 


G.SET.LE.Zsize rd=rc 


<= 


G.SET.GE.U.size rd=rc,rc 


G.SET.NE.Z.size rd=rc 


<- 


G.SET.AND.NE.size rd=rc,rc 


G.SET.G.size rd=rb,rc 


-> 


G.SET.L.size rd=rc,rb 


G.SET.G.U.sIze rd=rb,rc 


—> 


G.SET.L.U.size rd=rc,rb 


G.SET.LE.size rd=rb,rc 




G.SET.GE.size rd=rc,rb 


G.SET.LE.U.size rd=rb,rc 


-> 


G.SET.GE.U.size rd=rc,rb 



Fig. 33A (cont'd) 



Format 



G.op.size rd=rb,rc 
rd=gopsize(rb,rc) 

31 24 23 18 17 12 11 65 0 

I G.size I rd I re I rb I op I 

8 6 6 6 6 



Fig. 33B 



Definition 

def GroupReversed(op,size,rd,rc,rb) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
cas op of 
G.SUB: 

for i +- 0 to 128-size by size 

ai+size-1.j «- b i+size-1..i - Ci+size-1..i 
endfor 
G.SUB.L: 

for i <r- 0 to 128-size by size 

1 «- (bj +S j Z e-i || bj+size-1 ..i) - fa+size-1 II Cj+ S ize-1..i) 

aj+size-1..i «- Osize * *size-l) 7 (*size II *tK£l) : t S ize-1.. 
endfor 
G.SUB.LU: 

for i +- 0 to 128-size by size 

1 4- (0 1 || bj+size-U) • (0 1 || q+size-1..i) 
ai+size-1..i *- Csize * 0) ? 0 size : tsbe-i..o 
endfor 
G.SUB.O: 

for i <- 0 to 128-size by size 

t <- (bj+size-1 II bj+size-1 ..i) - (q+size-1 II q+size-1..i) 
if (tsize**size-l)then 

raise FixedPointArithmetic 

endif 

aj+size-1..i«-tsize-1..0 
endfor 
G.SUB.U.O: 

for i <- 0 to 128-size by size 

t <- (0 1 || bj+size-1 ..i) - (0. 1 || q+size-U) 
if (*size * 0) then 

raise FixedPointArithmetic 

endif 

ai+size-1..i<-tsize-1..0 
endfor 
G.SET.E: 

for i <- 0 to 128-size by size 

aj+size-U *- (bi+size-1..i = Cj+size-L.i) 812 ® 
endfor 
G.SET.NE: 

for i +- 0 to 1 28-size by size 

aj+size-1.J «- (bj+size-1..i * Cj+size-l.j) 8126 
endfor 
G.SET.AND.E: 

for i <- 0 to 128-size by size 

ai+size-U «- ((bj+size-1 ..i and q+ S lze-1..i) = 0) size 
endfor 

Fig. 33C 



G.SET.AND.NE: 

for i «- 0 to 128-size by size 

ai+size-l..i <- ((bi+size-1..i and q+ S ize-1..i) * 0) sce 
endfor 
G.SET.L: 

for i <- 0 to 1 28-size by size 

aj+size-1..i «- ((rc = rb) ? (bj +S j ze -l..i < 0) : (bj +S ize-1..i < q+size-1..i)) slze 
endfor 
G.SET.GE: 

for i <- 0 to 128-size by size 

ai+size-1..i «- ((re = rb) ? (bi +S lze-1..i * 0) : (bi+size-1..i * Cj+ S ize-1..i)) slze 
endfor 
G.SET.LU: 

for i <- 0 to 128-size by size 

ai+size-1 J «- ((rc = rb) ? (bj +S ize-1..i > 0) : 
((0 II b i+S i Z e.i..j) < (0 || q+size-U))) 8126 

endfor 
G.SET.GE.U: 

for i 0 to 128-size by size 

a i+S ize-1 ..i «- ((rc = rb) ? (bj +size -i j £ 0) : 
((0 || b^i^ j) 2> (0 || q+size-U))) 8126 

endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 33C (cont'd) 



E.DIV.64 


Ensemble divide signed octlets 


E.DIV.U.64 


Ensemble divide unsigned octlets 


E.MUL.8 


Ensemble multiply signed bytes 


E.MUL16 


Ensemble multiply signed doublets 


E.MUL.32 


Ensemble multiply sighed quadlets 


E.MUL.64 


Ensemble multiply signed octlets 


E.MUL.SUM.8 


Ensemble multiply sum signed bytes 


E.MULSUM.16 


Ensemble multiply sum signed doublets \ 


E.MUL.SUM.32 


Ensemble multiply sum signed quadlets 


E.MUL.SUM.64 


Ensemble multiply sum signed octlets 


E.MUL.C.8 


Ensemble complex multiply bytes 


E.MULC.16 


Ensemble complex multiply doublets 


E.MUL.C.32 


Ensemble complex multiply quadlets 


E.MUL.M.8 


Ensemble multiply mixed-signed bytes 


E.MULM.16 


Ensemble multiply mixed-signed doublets 


E.MULM.32 


Ensemble multiply mixed-signed quadlets 


E.MUL.M.64 


Ensemble multiply mixed-signed octlets 


E.MUL.P.8 


Ensemble multiply polynomial bytes 


E.MUL.P.16 


Ensemble multiply polynomial doublets 


E.MUL.P.32 


Ensemble multiply polynomial quadlets 


E.MUL.P.64 


Ensemble multiply polynomial octlets 


E.MUL.SUM.C.8 


Ensemble multiply sum complex bytes 


E.MUL.SUM.C.16 


Ensemble multiply sum complex doublets 


E.MUL.SUM.C.32 


Ensemble multiply sum complex quadlets 


E.MUL.SUM.M.8 


Ensemble multiply sum mixed-signed bytes j 


E.MULSUM.M.16 


Ensemble multiply sum mixed-signed doublets 


E.MUL.SUM.M.32 


Ensemble multiply sum mixed-signed quadlets 


E.MULSUM.M.64 


Ensemble multiply sum mixed-signed octlets 


E.MULSUM.U.8 


Ensemble multiply sum unsigned bytes 


E.MULSUM.U.16 


Ensemble multiply sum unsigned doublets 


E.MUL.SUM.U.32 


Ensemble multiply sum unsigned quadlets 


E.MULSUM.U.64 


Ensemble multiply sum unsigned octlets 


E.MUL.U.8 


Ensemble multiply unsigned bytes 


E.MUL.U.16 


Ensemble multiply unsigned doublets 


E.MULU.32 


Ensemble multiply unsigned quadlets 


E.MUL.U.64 


Ensemble multiply unsigned octlets 



Fig. 34A 



Format 

E.op.size rd=rc,rb 
rd=eopsize(rc,rb) 

31" 24 23 18 17 12 11 65 0 

I E.size | rd | rc | rb | op 

8 6 6 6 6 



Fig. 34B 



D finition 

del fnul(size,h,vs.v,i,ws,wj) as 

mul«-((vs&v stee -i + i) h - size l|Vsize-1*l..i)'((ws&w S | 2 e.i +j r s,z II w S ize-1+j..j) 
endd f 

def c <- PolyMultiply(size.a,b) as 

PIOI^-O 2 * 8 " 26 
for k *- 0 to size-1 

p[k+1] <- pM * a k ? (0 size - k || b || 0 k ) : O 2 * 8126 

endfbr 
c 4- p[slze] 
nddef 

def EnsemWe(op,size t rd.rc,rb) 
c«-RegRead(rc128) 
b4-RegRead(rb, 128) 
case op of 

E.MUL:, E.MULC:, EMULSUM, E.MUL.SUM.C, E.CON, E.CON.C. E.DIV: 

cs 4- bs <- 1 
E.MUL.M:, EMULSUM.M, E.CON.M: 

CS4-0 

DS4-1 

E.MULU:, EMULSUM.U. E.CON.U, E.DIV.U, E.MULP: 

CS4- DS4- 0 

endcase 
case op of 

E.MUL, E.MULU. E.MUL.M: 

for i «- 0 to 64-size by size 

d2*(i+size)-1..2*i <~ nttJl(size t 2*size,cs,c,i,bs,b,i) 

endfor 
- E.MULP: 

for i 4- 0 to 64-size by size 

c*2*(i + size)-1..2*i «- PolyMuWply(slze ( p S | Z e-lHJ. b slze-1+i..i) 

endfor 
E.MULC: 

for i <- 0 to 64-size by size 
if (i and size) = 0 then 

p 4- mul(size,2*size,1,c,i,1.b,i) - muKsize,2*size,1,c,i+size,1,b,i+size) 



p 4- mul(size,2*size,1,c,i,1.b,i+size) + mu!(size,2*size,1,c,i,1,b,i+size) 
endif 

d2*(i+sizeM..2*i<-P 

endfor 

E.MULSUM, E.MULSUM.U, E.MULSUM.M: 
p[0]4-0 128 

for i 4- 0 to 128-size by size 

pp+size] 4- p[i] ♦ mul(size,128 f cs,c,i,bs.b.i) 

endfor 
a 4- p[128) 
E.MULSUM.C: 

PI0J4-0 64 

p[size] 4- 0 64 

for i 4- 0 to 128-size by size 
if 0 ano &ze) = 0 then 

pp4^*size) 4- p[»] + mul(size,64,1,c,i,1,b,i) 

- mul(size t 64,1 f c,i+size t 1 t b r i+size) 



pp+2*size] 4- ppl ♦ mu!(size,64 t 1,c,i,1.b.i+size) 

+ mul(size,64,1 ,c,i+size t 1 ,b,i) 

endif 

ndfor 

a 4- p[128+size] || p[128] 

Fig. 34C 



E.CON, E.CON.U, E.CON.M: 
pI0]<-0 128 

for J «<— 0 1 64-sizebysiz 

for i <- 0 to 64-size by siz 

pD+size] 2 *(i+ S ize)-1..2*i «- PDl2*(i+slz + 
mul(size,2*size,cs,c,i+64-| ( bs,bJ) 

endfor 

endfor 
a <- p[64] 

E.CON.C: 

p[0] <- 0 128 

for j «- 0 to 64-slze by size 

for i 4- 0 to 64-size by size 

if ((H) and j and size) = 0 then 

pD+size)2»(i+size)-1..2*i «- PlDrfl+sizeM.^i 
mul(size,2*size,1,cJ+64-j f 1 .b j) 

else 

pD+sizeJ2«(Ksize)-1..2*i «- PlD2*(i+size)-1..2*i 
mul(size t 2*size,1,cj+64-j+2*size,1,bj) 

endif 

endfor 

endfor 
a <- p[64] 

E.DIV: 

if (b = 0) or ( (c = (1||0 63 )) and (b = 1 64 ) ) then 
a <- undefined 

else 

q«-c/b 

r c - q*b 

a «- r 63..0 II P63..0 

endif 
E.DIV.U: 

if b = 0then 

a 4- undefined 

else 

q<-(0||c)/(0i|b) 
r^c-(0||qr(0||b) 
a «- f63..0 II ^63..0 

endif 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

none 



Fig. 34C (cont'd) 



/-\ /-v/^» j AKir\ c o 

G.COM.AND.b.8 


fi m 1 1 rv rAmnaro onH pnital 7orft nx/tPQ 

oroup compare anu equdi £ciu uyico 


G.COM.AND.b.lo 


firm m mmnaro anH oni ol 7orn HminlptQ 


G.COM.ANU.b.o^ 


l^rni m rftmnaro anH poiiaI 7Prn nimHtpfc 
Oiuup isUllipdio dliu oqudi £J3\\J v^uavJicio 


G.COM.ANU.b.o4 


firm in romnaro anH oni is I 7prn octlptQ 
OlUUp vUIIipait? dliu c?qudi tciu VAsiiCsio 


c*r\Kh a Mr\ c a oq 
G.COM.ANU.b.l^o 


firm in rnmnarp anH ontifll 7 pro hpyfpt 
OiUUp LrUilipait? aliu cijuai 1 icAici 


a% ^/"\M AMR MC Q 

G.OUM.ANU.Nb.o 


r^mi in rnmnaro AnH nnt phiiaI 7Pro hvtp^ 
OIUUp LrUiiipdit? di ivj iiul cijuai tciu uyico 


G.OUM.AlNU.INIb.l 0 


r^mi m mmnaro and nnt phiiaI 7Prn rinuhlpt<» 
Olwup VA/iiipdic di iu 1 iv/i cv^uai *.ciu uv/uuicio 


G.CUM.AINU.Nt.o^ 


firm in romnaro anH not pniml 7Prn nilpHlptQ 
Oiuup VA/iiipdio diiVJ %i\Ji ov^udi tciu v|uauic?io 


G.COM.ANU.Nb.b4 


firm in r*nmnarp anH nnt pni ol 7Prn nptlptQ 


G.COM.AND.Nb.12o 


firm in rnmnaro onH nnt oni 10I 7Prn Hpylot 

oruup cuinpdre dnu nui cLjUcii zuiu iicaiui 


G.COM.b.o 


fir^M ir\ AAmnora aai 10I K\/toc 

oruup compare ocjuai uyit?o 


G.COM.b.16 


fi rr\ 1 1 r*\ AAmn^ra aaiioI Hai thiotc 

oroup compare equal uuuuieis 


G.COM.E.32 


fir<si m AAfrtAQPA Am 10I ni lonlotc 

oroup compare equal quauieis 


G.COM.E.64 


/^«p/>>i * r> AAntAQfA a ^11 iqI nr*tlcfro 

oroup compare equal ocueio 


G.COM.E.128 


oroup compare equal nexiei 


G.COM.GE.8 


oroup compare greater equal signea oyres 


G.COM.GE.16 


oroup compare greater equal signeo oouDieis 


G.COM.GE.32 


oroup compare greater equal signeo quaoiets 


G.COM.GE.64 


oroup compare greater equal signea octiets 


G.COM.GE.128 


Pmiin AA*v%r\APA ArAO^Ar qai ioI ciaaqH KavI 

oroup compare greater equal signeo nexiet 


G.COM.GE.U.o 


A. A . AAMinArA APAAtar qai tol i incinnoH K\/toc 

oroup compare greater equal unsigneu oytes 


G.COM.GE.IL16 


oroup compare greater equal unsigneu oouuiets 


G.COM.GE.U.32 


A»/m i AAWinnrA ^» ^% 4 r r\ r** I ■ lAC^lAA^^A Al lAAIATC 

oroup compare greater equal un signeo quaoiets 


G.COM.GE.U.64 


AMiin AArAAAPA APAAtAP A A 1 1 0 1 1 IACIAAaH nT*tlotC 

oroup compare greater equal unsignea octiets 


G.COM.GE.U.128 


PfAtIA AAWftAAP^A APOAtAP A Al 1 ol t IACIAAaH h A vl A^ 

oroup compare greater equal unsigneu nexiet 


G.COM.Lo 


oroup compare signeo less Dytes i 


G.COM.L16 


Ami ia AnmnAPA cIaaa/4 Iacp Hai ll^l A^O 

oroup compare signea less aouoiets 


G.COM.L.32 


oroup compare signea less quaoiets 


G.COM.L.64 


oroup compare signea less octiets 


G.COM.L.128 


PpAIIA AAHIAAPA f» IAAAA* 1 AI^C A Qvt At 

oroup compare signea less nexiet 


G.COM.L.U.8 


f*rAiiA aawiaapa Iaoa i tncinnoH K\/tfiC 

oroup compare less unsignea oytes 


G.COM.L.U.16 


oroup compare less unsignea aouoiets 


G.COM.L.U.32 


^r/M 1 A AAPA A APA IaaA lir*lCIAAAA Al lAAlATA 

oroup compare less unsignea quaoiets 


G.COM.LU.64 


oroup compare less unsignea octiets 


G.COM.LU.128 


oroup compare less unsignea nexiet 


AAii |l ir— a 

G.COM.NE.8 


^PAI IA AAPA A A P*A AA'f AAI IaI Kl/tAC 

oroup compare not equal Dytes 


ft POM MP 1fi 
O.OV-/IVI.INC. ID 


Groun comnare not eaual doublets 


G.COM.NE.32 


Group compare not equal quadlets 


G.COM.NE.64 


Group compare not equal octiets 


G.COM.NE.128 


Group compare not equal hexlet 



Fig. 35A 



Format 



G.COM.op.size rd.rc 
G.COM.opz.size red 

gcomopsize(rd.rc) 

31 24 23 18 17 12 11 65 0 

I G.size | rd | re I op j GCOM | 

8 6 6 6 6 



Fig. 35B 



Definition 

def GroupCompare(op,size,rd ( rc) 
d <- RegRead(rd, 128) 
c «- RegRead(rc, 128) 
case op of 

G.COM.E: 

for i 4- 0 to 128-size by size 

ai+size-1..i +- (dj+size-U = Cj+size-U) 5 * 0 
endfor 
G.COM.NE: 

for i 0 to 128-size by size 

ai+size-1..i «- (d|+size-1..i * q+sfce-u) 8 * 8 
endfor 
G.COM.AND.E: 

for i <- 0 to 128-size by size 

ai+size-1..l «- ((q+size-1..i and dj +S jze-1..i) = 0) slze 
endfor 
G.COM.AND.NE: 

for i <- 0 to 128-size by size 

aj+size-1..i «- ((q+size-1..l and dj+sfce-u) * 0) sfee 
endfor 
G.COM.L: 

for i <- 0 to 128-size by size 

ai+size-1..i «- ((rd = rc) ? (q +S ize-1J < 0) : (d i+S ize-1.J < Cj +S ize-1..0) slze 
endfor 
G.COM.GE: 

for i <- 0 to 128-size by size 

a i+S ize-1 ..i <- <(rd = rc) ? (q +S ize-1 ..i * 0) : (d j+siZ e-i . j 2> q +S ize-1 ..i)) size 
endfor 
G.COM.LU: 

for i <- 0 to 128-size by size 

aj+size-1..i <- ((rd = rc) ? (q+ S ize-1..i > 0) : 
((0 II d+sbe-u) < (0 H c j+S ize-1..i))) slze 

endfor 
G.COM.GE.U: 

for i ^- 0 to 128-size by size 

a j+size-1 ..i +~ ((rd = rc) ? (q +S fee-1 ..i * 0) : 
((0 II dj +siZ e-i..i) * (0 1| q+size-u))) 5126 

endfor 

endcase 
if (a * 0) then 

raise FixedPointArithmetic 

endif 
encidef 



Exceptions 

Fixed-point arithmetic 



Fig.35C 



E LOG MOST.8 


Ensemble log of most significant bit signed bytes 


E L0G.M0ST.16 


Ensemble log of most significant bit signed doublets 


E LOG.MOST.32 


Ensemble log of most significant bit signed quadlets 


E.LOG.MOST.64 


Ensemble log of most significant bit signed octlets 


E.LOG.MOST.128 


Ensemble log of most significant bit signed hexlet 


E L0G.M0ST.U.8 


Ensemble log of most significant bit unsigned bytes 


E LOG MOST U 16 


Ensemble log of most significant bit unsigned doublets 


E LOG MOST U 32 


Ensemble log of most significant bit unsigned quadlets 


E LOG MOST U 64 


Ensemble log of most significant bit unsigned octlets 


E LOG MOST U 128 


Ensemble log of most significant bit unsigned hexlet 


E SUM 8 


Ensemble sum signed bytes 


E SUM 16 


Ensemble sum signed doublets 


E SUM 32 


Ensemble sum signed quadlets 


E.SUM.64 


Ensemble sum signed octlets 


E.SUM.U.1 


Ensemble sum unsigned bits 


E.SUM.U.8 


Ensemble sum unsigned bytes 


E.SUM.U.16 


Ensemble sum unsigned doublets 


E.SUM.U.32 


Ensemble sum unsigned quadlets 


E.SUM.U.64 


Ensemble sum unsigned octlets 



Selection 



class 


op 


size 


sum 


SUM 


8 16 32 64 


SUM.U 


1 8 16 32 64 


log most 
significant bit 


LOG.MOST LOG.MOST.U 


8 16 32 64 128 : 



Fig. 36A 



Format 



E.op.size rd=rc 
rd=eopsize(rc) 

31 24 23 18 17 12 11 6 5 0 

I E.size I rd I rc I op I E.UNARY | 

8 6 6 6 6 



Fig. 36B 



Definition 



def EnsembleUnary(op,size,rd,rc) 
c <- RegRead(rc, 128) 
case op of 

E.LOG.MOST: 

for i <- 0 to 128-size by size 
if (cj+size-U =0 ) 

a i+size-1..i <- "1 

else 

for j <- 0 to size-1 

■f Csbe-1+L.j+i = (4&tVh II not c size-1+l) ^en 
aj+size-1..i<-j 

endif 
endfor 

endif 
endfor 
E.LOG.MOSTU: 

for i <- 0 to 1 28-size by size 

if (Ci+size-1..i = 0)then 

ai+size-1..i<~-1 

else 

for j to size-1 

if Csize-1+l..j+i = (0 size -H || 1) then 
ai+size-1..i«-j 

endif 
endfor 

endif 
endfor 
E.SUM: 

p[0]<-0 1 28 

for i 4- 0 to 1 28-size by size 

p[i+size] <- p[i] + (c|2|^fee || Csfce-1+Li) 
endfor 
a<-p[128] 
E.SUMU: 

p[0]<-0 128 

for i <- 0 to 128-size by size 

pp+size] <- p[i] + (0128-size y c si2 e-i +U ) 
endfor 
a<-p[128] 

endcase 

RegWrite(rd f 128, a) 
nddef 

Exceptions 

none 



Fig. 36C 



Floating-point function Definitions 

def eb <- ebits(prec) as 
case pref of 



16: 






eb<-5 


32: 






eb<-8 


64: 






eb<-11 


128: 






eb*-15 



endcase 
nddef 

def eb <- ebias(prec) as 

eb<-0|| iebits(precH 
enddef 

def fb «- fbits(prec) as 
fb «- prec - 1 - eb 
nddef 

def a <- F(prec, ai) as 
a.s a^prec-1 
ae <- ai p rec-2..fbits(prec) 

af^aifbits(prec)-1..0 
tfae=1 ebits(prec) then 

ifaf = Othen 

a.t <- INFINITY 
elseif affbits(prec)-1 then 

a.t <- SNaN 

a.e <- -fbits(prec) 

a.f*-1 II affbits(prec)-2..0 

else 

a.t <- QNaN 
a.e «- -fbits(prec) 
a.f 4- af 

endif 

Fig. 37 



Iseif ae = 0 then 
if af = Othen 

a.t 4- ZERO 

else 

a.t 4- NORM 

a.e 4- 1-ebias(prec)-fbits(prec) 
a.f4-0||af 

endif 

else 

a.t 4- NORM 

a.e 4- ae-ebias(prec)-fbits(prec) 
a.f4-1 || af 

endif 
enddef 

def a <- DEFAULTQNAN as 

a.s 4-0 

a.t 4- QNAN 

a.e 4- -1 

a.f4-1 
enddef 

def a 4- DEFAULTSNAN as 

a.s 4-0 

a.t 4- SNAN 

a.e 4- -1 

a.f4-1 
enddef 

def fadd(a.b) as faddr(a,b,N) enddef 

def c 4- faddr(a,b,round) as 

if a.t=NORM and b.t=NORM then 

// d,e are a,b with exponent aligned and fraction adjusted 
if a.e > b.e then 
d 4- a 
e.t4-b.t 
e.s 4- b.s 
e.e 4- a.e 

e.f4-b.f||0 a ^ be 
else if a.e < b.e then 
d.t 4- a.t 
d.s 4- a.s 
d.e 4- b.e 

d.f4-a.f|| o b *- ae 
e4- b 

endif 
at 4- d.t 
c.e 4- d.e 
if d.s = e.s then 

c.s 4- d.s 

c.f 4-d.f + e.f 
elseif d.f >e.f then 

c.s 4- d.s 

c .f<-d.f-e.f 



Fig. 37 (cont'd) 



elseif d.f < e.f then 
as <- .s 
af<-e.f-d.f 

else 

c.s 4- r=F 
c.t <- ZERO 

endif 

// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 
c <- b 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c <- a 

elseif a.t=ZERO and b.t=ZERO then 
at <- ZERO 

as <- (a.s and b.s) or (round=F and (a.s or b.s)) 
// NULL values are like zero, but do not combine with ZERO to alter sign 
elseif a.t=ZERO or a.t=NULL then 

c <- b 

elseif b.t=ZERO or b.t=NULL then 
c <— a 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c DEFAULTSNAN // Invalid 

else 

Cf-a 

endif 

elseif a.t=INFINITY then 
c«-a 

elseif b.t=INFINITY then 
c*-b 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def b <- fneg(a) as 

b.s <- -a.s 

b.t <- a.t 

b.e <- a.e 

b.f<-a.f 
enddef 

def fsub(a,b) as fsubr(a,b t N) enddef 

def fsubr(a,b,round) as faddr(a,fneg(b),round) enddef 

def frsub(a,b) as frsubr(a t b,N) enddef 

def frsubr(a,b,round) as faddr(fheg(a),b,round) enddef 

def c <- fcom(a,b) as 

if (a.t=SNAN) or (a.t=QNA» i) or (b.t=SNAN) or (b.t=QNAN) then 
c<-U 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c <- (a.s=0) ? G: L 

Fig. 37 (cont'd) 



Ise 

C4-E 

endif 

elseif a.t=INFINITY then 
c 4- (a.s=0) ? G: L 
Iseifb.t^lNFINITYthen 

c<-(b.s=0)?G:L 
elseif a.t=NORM and b.t=NORM then 
if a.s * b.s then 

c 4- (a.s=0) ? G: L 

else 

if a.e > b.e then 
af <- a.f 

bf<-b.f|| O ae - be 

else 

af 4- a.f || o b ^ ae 
bf<-b.f 

endlf 

ifaf=bfthen 

C4-E 

else 

C4-((a.s=0) A (af>bf))?G:L 

endif 

endif 

elseif a.t=NORM then 

c 4- (a.s=0) ? G: L 
elseif b.t=NORM then 

C4-(b.s=0)?G:L 
elseif a.t=ZERO and b.t=ZERO then 

C4-E 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def c «- fmul(a,b) as 

if a.t=NORM and b.t=NORM then 

c.s 4- a.s A b.s 

at 4- NORM 

c.e <- a.e + b.e 

c.f<-a.f*b.f 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s 4- a.s A b.s 

c.t4-b.t 

c.e 4- b.e 

c.f*-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s 4- a.s A b.s 
c.t 4- a.t 
c.e 4- a.e 
c.f 4- a.f 

elseif a.t=ZERO and b.t=INFIIMITY then 

c 4- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=ZERO then 

c 4- DEFAULTSNAN // Invalid 



Fig. 37 (cont'd) 



elseif a.t=ZERO or b.t=ZERO then 
c.s «- a.s A b.s 
c.t <- ZERO 

else 

assert FALSE // should have covered al the cases abov 

endrf 
enddef 

def c <- fdlvr(a f b) as 

if a.t=NORM and b.t=NORM then 
c.s <- a.s A b.s 
c.t <- NORM 
c.e <- a.e - b.e + 256 

c.f<-(a.f|| O 256 )^ 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s <- a.s A b.s 

c.t<-b.t 

c.e <- b.e 

c.f<-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s <- a.s A b.s 
c.t <- a.t 
c.e <- a.e 
c.f «- a.f 

elseif a.t=ZERO and b.t=ZERO then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=INFINITY then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=ZERO then 

c.s <- a.s A b.s 

c.t «- ZERO 
elseif a.t=INFINITY then 

c.s *- a.s A b.s 

c.t <- INFINITY 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def msb <- findmsb(a) as 

MAXF <- 2 18 // Largest possible f value after matrix multiply 
forj<-OtoMAXF 

if aMAXM.j ■ (O 1 ^^ 1 ^ H 1) then 
msb j 

endrf 
endfor 
nddef 

def ai <- PackF(prec l a,round) as 
case a.t of 
NORM: 

msb <- findmsb(a.f) 

m <- msr>1-fbits(prec) // Isb for normal 

rdn <- -ebias(prec)-a.e-1-fbits(prec) // Isb if a denormal 

rb 4- (m > rdn) ? m : rdn 



Fig. 37 (cont'd) 



if rb £ 0 then 

aifr<-a.f msb -i..o HO"* 
adj<-0 

Ise 

case round of 

s <- o m8b "* || (-a.s)* 

F: 

s <- omsb-ib || ( a .s)rt> 
N, NONE: 

s^O msb - rb ||-a.f rt) ||a.f^ 1 

X: 

if a f rt>-1 ..0*0 then 

raise Floating PointArithmetic // Inexact 

endif 
s <- 0 

Z: 

s«-0 

endcase 

v^(0||a.f ms b..o) + (0||s) 
■fvmsb = 1 then 

aifr^v ms b.i..rb 

eadj <- 0 

else 

aifr^O^tP^) 
eadj <- 1 

endif 

endif 

aien <- a.e + msb - 1 + eadj + ebias(prec) 
if aien z 0 then 

if round - NONE then 

ai <- a.s || o ebfts (P rec > || aifr 

else 

raise FloatingPointArithmetic //Underflow 

endif 

elseif aien £ iebits(prec) 
if round = NONE then 

//default round-to-nearest overflow handling 
ai <- a.s || i^bits(prec) || Qfbits(prec) 

else 

raise FloatingPointArithmetic //Underflow 

endif 

else 

ai *- a.s || aien e bits(prec)-1..0 H aifr 

endif 
SNAN: 

if round * NONE then 

raise FloatingPointArithmetic //Invalid 

endif 

if -a.e < fbits(prec) then 

ai <- a.s || isbits(prec) || a.f. a .e-1..0 II 0** 8 0 MBC )* a ' e 

Fig. 37 (cont'd) 



else 

Isb <- a.f. a .e-1-fbits(prec)+1..0 * 0 

ai <- a.s || 1 bits(prec) , a Wl..-a.o-1-fbH8(prec)*2 II Isb 

endif 
QNAN: 

if -a.e < fbits(prec) then 

ai <- a.s || iebits(prec) || a.f. a .e-i..o II O fbits ft >rec ) +a e 

else 

Isb <r- a.f. a .e-1-fbits(prec)+1..0 * 0 

ai*- a.s || lebits(prec) g aWl..-a.e-14bits(prec)+2 II Isb 

endif 
ZERO: 

ai a.s || o ebits (P rec ) || 0 fbits (P rec > 
INFINITY: 

ai <- a.s || lebits(prec) || 0 fbits(prec) 

endcase 
defdef 

def ai <- fsinkr(prec, a, round) as 
case a.t of 
NORM: 

msb <- findmsb(a.f) 
rb <- -a.e 
if rb £ 0 then 

aifr^a.f msb ..ollO- rt> 
aims <- msb - rb 

else 

case round of 
C, CD: 

s ^ 0 msb-rb||^ als) rb 

F, F.D: 

s <- Q™t>-rt> || (ai.s)* 
N, NONE: 

s <- Omsk-* || -ai.frb II ai.ffc 1 

X: 

if ai.frt)-i„o* othe . n 

raise FloatingPointArithmetic // Inexact 

endif 
s <- 0 
Z, Z.D: 

s <- 0 

endcase 

V4-(0||a.f ms b..0) + (0lls) 
if v msb = 1 frsn 

aims <- msb + 1 - rb 

else 

aims «- msb - rb 

endif 

aifr ^- v a | ms ..rt) 

endif 

if aims > prec then 
case round of 

CD, F.D, NONE, Z.D: 

ai <- a.s || (-asjP"^ 1 

Fig. 37 (c nfd) 



C. F, N, X, Z: 

rais FloatingPointArithmetic // Overflow 

ndcase 
elseif a.s = 0 then 
ai <- aifr 

else 

ai «- -aifr 

endrf 
ZERO: 

ai *- 0P rec 
SNAN, QNAN: 

case round of 

CD, F.D, NONE, Z.D: 

ai<-0P rec 
C, F, N,X, Z: 

raise FloatingPointArithmetic // Invalid 

endcase 
INFINITY: 

case round of 

CD, F.D, NONE, Z.D: 

ai <- a.s || (-as)P rec - 1 
C, F, N,X,Z: 

raise FloatingPointArithmetic // Invalid 

endcase 

endcase 
enddef 



def c <- frecrest(a) as 
b.s*-0 
b.t <- NORM 
b.e<-0 
b.f*-1 

c<-fest(fdiv(b,a)) 
nddef 

def c «- frsqrest(a) as 
b.s 0 
b.t <- NORM 
b.e«-0 
b.f<-1 

c «- fest(fsqr(fdiv(b,a))) 
nddef 

def c «- fest(a) as 

if (a.t=NORM)then 

msb «- findmsb(a.f) 
a.e <- a.e + msb - 13 
af«-a.fmsb..msb-12ll 1 

else 

c <- a 

endif 
enddef 

def c <- fsqr(a) as 

if (a.t=NORM) and (a.s=0) then 
c.s«-0 
ct«-NORM 
if(a.eo = 1)then 

Fig. 37 (cont'd) 



c. <-(a.e-127)/2 
c.f <-sqr(a.f||0 127 ) 

els© 

c. <-(a.e-128)/2 
c.f<-sqr(a.f|| 0 128 ) 

endif 

elseif (a.t=SNAN) or (a.t=QNAN) or a.t=ZERO or ((a.t=INFINITY) and (a.s=0)) then 

C 4—* a 

elseif ((a.t=NORM) or (a.t=INFINITY)) and (a.s=1) then 
c <- DEFAULTSNAN // Invalid 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

Fig. 37 (cont'd) 



E.ADD.F.16 


Ensemble aoo Tioating-poini nan 


E.ADD.F.16.C 


CncAmhla oHrl flr.atinn-nr»int half PPilinn 
cnsernDie auU nUdlliiy-pwiiii nan ucinuy 


E.ADD.F.16.F 


CnpomKfo oHH flr*of inn-rv.int half flnnr 

tnsernDie auu iioaung-puiiu iiaii nuui 


E.ADD-F.16.N 


CncAmKlA qHH flf>otinn_r\rvnt half noarPQt 

bnsemDie auu Hoaiing-puini r icui ncdicdi 


E.ADD.F.16.X 


CncAmKIa nr\r\ flr\otinrt_r\oint Half PY3Pt 

tnsemuie aoo noaiing-puiiu iicim cacioi 


E.ADD.F.16.Z 


Ensemble aaa Tioaiing-poini nan zero 


E.ADD.F.32 


Ensemble add floating-point smgie 


E.ADD.F.32.C 


Ensemble add floating-point smgie ceiling 


E.ADD.F.32.F 


Ensemble add floating-point smgie noor 


E.ADD.F.32.N 


ensemble add floating-point smgie nearest 


E.ADD.F.32.X 


Ensemble add floating-point smgie exact 


E.ADD.F.32.Z 


Ensemble add floating-point single zero 


E.ADD.F.64 


Ensemble add floating-point double 


E.ADD.F.64.C 


Ensemble add floating-point double ceiling 


E.ADD.F.64.F 


Ensemble add floating-point double floor 


^» A P^ A a A t 

E.ADD.F.64.N 


— _ i i _ _ J J flAoiiMM maim! /4#m il^l/s nA^PAPT 

Ensemble add floating-point double nearest 


E.ADD.F.64.X 


Ensemble add floating-point double exact 


E.ADD.F.64.Z 


Ensemble add floating-point double zero 


E.ADD.F.128 


Ensemble add floating-point quad 


E.ADD.F.128.C 


Ensemble add floating-point quad ceiling 


E.ADD.F.128.F 


Ensemble add floating-point quad floor 


E.ADD.F.128.N 


Ensemble add floating-point quad nearest 


E.ADD.F.128.X 


Ensemble add floating-point quad exact 


E.ADD.F.128.Z 


Ensemble add floating-point quad zero 


E.DIV.F.16 


Ensemble divide floating-point half 


E.DIV.F.16.C 


Ensemble divide floating-point half ceiling 


E.DIV.F.16.F 


Ensemble divide floating-point halt floor 


E.DIV.F.16.N 


_ - - - I - 1 - J' * _J ^ XI aa a4i«%M AAAv AWA I -MA 4 P-A ^% IX AA\/\rA^T 

Ensemble divide floating-point halt nearest 


E.DIV.F.16.X 


Ensemble divide floating-point hair exact 


m~ mm*, am g A ^% »«•> 

E.DIV.F.16.Z 


Ensemble divide floating-point halt zero 


E.DIV.F.32 


Ensemble divide floating-point single 


c ni\/ p 


Fn^pmhlp riividp flnatina-Doint sinale ceilino 


E.DIV.F.32.F 


Ensemble divide floating-point single floor 


E.DIV.F.32.N 


Ensemble divide floating-point single nearest 


E.DIV.F.32.X 


Ensemble divide floating-point single exact 


E.DIV.F.32.Z 


Ensemble divide floating-point single z^ro 


E.DIV.F.64 


Ensemble divide floating-point double 



Fig. 38A 



E.DIV.F.64.C 


Ensemble divide floating-point double ceiling 


E.DIV.F.64.F 


Ensembl divid floating-point double floor 


E.DIV.F.64.N 


Ensemble divide floating-point double nearest 


E.DIV.F.64.X 


Ensemble divide floating-point double exact 


E.DIV.F.64.Z 


Ensemble divide floating-point double zero 


E.DIV.F.128 


Ensemble divide floating-point quad 


E.DIV.F.128.C 


Ensemble divide floating-point quad ceiling 


E.DIV.F.128.F 


Ensemble divide floating-point quad floor 


E.DIV.F.128.N 


Ensemble divide floating-point quad nearest 


E.DIV.F.128.X 


Ensemble divide floating-point quad exact 


E.DIV.F.128.Z 


Ensemble divide floating-point quad zero 


E.MULC.F.16 


Ensemble multiply complex floating-point half 


E.MUL.C.F.32 


Ensemble multiply complex floating-point single 


E.MULC.F.64 


Ensemble multiply complex floating-point double 


E.MULF.16 


Ensemble multiply floating-point half 


E.MULF.16.C 


Ensemble multiply floating-point half ceiling 


E.MULF.16.F 


Ensemble multiply floating-point half floor 


E.MULF.16.N 


Ensemble multiply floating-point half nearest 


E.MUL.F.16.X 


Ensemble multiply floating-point half exact 


E.MUL.F.16.Z 


Ensemble multiply floating-point half zero 


E.MUL.F.32 


Ensemble multiply floating-point single 


E.MUL.F.32.C 


Ensemble multiply floating-point single ceiling 


E.MUL.F.32.F 


Ensemble multiply floating-point single floor 


E.MUL.F.32.N 


Ensemble multiply floating-point single nearest 


E.MUL.F.32.X 


Ensemble multiply floating-point single exact 


E.MUL.F.32.Z 


Ensemble multiply floating-point single zero 


E.MUL.F.64 


Ensemble multiply floating-point double 


E.MUL.F.64.C 


Ensemble multiply floating-point double ceiling 


E.MULF.64.F 


Ensemble multiply floating-point double floor 


E.MULF.64.N 


Ensemble multiply floating-point double nearest 


E.MUL.F.64.X 


Ensemble multiply floating-point double exact 


E.MUL.F.64.Z 


Ensemble multiply floating-point double zero 


E.MULF.128 


Ensemble multiply floating-point quad ] 


E.MUL.F.128.C 


Ensemble multiply floating-point quad ceiling 


E.MULF.128.F 


Ensemble multiply floating-point quad floor 


E.MULF.128.N 


Ensemble multiply floating-point quad nearest 


E.MULF.128.X 


Ensemble multiply floating-point quad exact 


E.MUL.F.128.Z 


Ensemble multiply floating-point quad zero 
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S lection 



place 




Dree 


round/traD 


add 


EADDF 


16 32 64 128 


noneCFNXZ 


divide 


EDIVF 


16 32 64 128 


none C F N X Z 


multiply 


EMULF 


16 32 64 128 


NONE C F N X Z 


complex multiply 


EMULC 
F 


16 32 64 


NONE 



Format 

E.op.prec.round rd=rc,rb 
rd=eopprecround(rc,rb) 

31 24 23 18 17 12 11 65 0 

I E.prec | rd | rc | rb | op.round~| 

8 6 6 6 6 



Fig. 38B 



Definition 

def mul(size f v f i,w j) as 

mul <- fimuKFCsize.Vsize-l+L.O.^siz .Wsize-1+j..j)) 
enddef 

def EnsembleFloatingPoint(op,prec t round/a f rb,rc) as 
c «- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i <- 0 to 128-prec by prec 
ci <- F(prec ( q +pre c-l.j) 
bi<-F(prec,bj + prec.l..i) 
case op of 

E.ADD.F: 

ai <- faddr(ci,bi,round) 
E.MULF: 

ai <- fmul(ci,bi) 
E.MULC.F: 

if (i and prec) then 

ai <- faddCmuKprec.c.i.b.i-prec), mul(prec,c,i-prec,b,i)) 

else 

ai <- fsub(mul(prec,c f l,b,l) f mul(prec,c,i + prec,b,i+prec)) 

endif 
E.DIV.F.: 

ai«-fdiv(ci,bi) 

endcase 

ai+prec-1..i «- PackF(prec ? ai f round) 
endfor 

RegWrite(rd f 128 f a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 38C 



Operation codes 



E.MUL.ADD.C.F.16 


Ensemble multiply add complex floating-point half 


E.MUL.ADD.C.F.32 


Ensemble multiply add complex floating-point single 


E.MUL.ADD.C.F.64 


Ensemble multiply add complex floating-point double 


E.MULADD.F.16 


Ensemble multiply add floating-point half 


E.MUL.ADD.F.16.C 


Ensemble multiply add floating-point half ceiling 


E.MUL.ADD.F.16.F 


Ensemble multiply add floating-point half floor 


E.MULADD.F.16.N 


Ensemble multiply add floating-point half nearest 


E.MUL.ADD.F.16.X 


Ensemble multiply add floating-point half exact 


E.MUL.ADD.F.16.Z 


Ensemble multiply add floating-point half zero 


E.MUL.ADD.F.32 


Ensemble multiply add floating-point single 


E.MUL.ADD.F.32.C 


Ensemble multiply add floating-point single ceiling 


E.MUL.ADD.F.32.F 


Ensemble multiply add floating-point single floor 


E.MUL.ADD.F.32.N 


Ensemble multiply add floating-point single nearest 


E.MUL.ADD.F.32.X 


Ensemble multiply add floating-point single exact 


E.MUL.ADD.F.32.Z 


Ensemble multiply add floating-point single zero 


E.MUL.ADD.F.64 


Ensemble multiply add floating-point double 


E.MUL.ADD.F.64.C 


Ensemble multiply add floating-point double ceiling 


E.MUL.ADD.F.64.F 


Ensemble multiply add floating-point double floor 


E.MUL.ADD.F.64.N 


Ensemble multiply add floating-point double nearest 


E.MUL.ADD.F.64.X 


Ensemble multiply add floating-point double exact 


E.MUL.ADD.F.64.Z 


Ensemble multiply add floating-point double zero 


E.MULADD.F.128 


Ensemble multiply add floating-point quad 


E.MUL.ADD.F.128.C 


Ensemble multiply add floating-point quad ceiling 


E.MUL.ADD.F.128.F 


Ensemble multiply add floating-point quad floor 


E.MUL.ADD.F.128.N 


Ensemble multiply add floating-point quad nearest 


E.MUL.ADD.F.128.X 


Ensemble multiply add floating-point quad exact 


E.MUL.ADD.F.128.Z 


Ensemble multiply add floating-point quad zero 


E.MULSUB.C.F.16 


Ensemble multiply subtract complex floating-point half 


E.MUL.SUB.C.F.32 


Ensemble multiply subtract complex floating-point single 


E.MULSUB.C.F.64 


Ensemble multiply subtract complex floating-point double 


E.MUL.SUB.F.16 


Ensemble multiply subtract floating-point half 


E.MUL.SUB.F.32 


Ensemble multiply subtract floating-point single 


E.MUL.SUB.F.64 


Ensemble multiply subtract floating-point double 


E.MUL.SUB.F.128 


Ensemble multiply subtract floating-point quad 



Fi?. 38D 



Sel ction 



class 


op 


type 


prec 


round/trap 


multiply add 


E.MUL.AD 
D 


F 


16 32 64 128 


noneCFNXZ 






C.F 


16 32 64 


NONE 


multiply subtract 


E.MULSU 
B 


F 


16 32 64 128 


NONE 






C.F 


16 32 64 


NONE 



Format 



E.op.size rd@rc,rb 
rd=eopsize(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I E.size I rd | rc | rb | op | 

8 6 6 6 6 



Fig. 38E 



Definition 

def mul(size,v t i,w f j) as 

mul <- fmul(F(size,v S j ze .i + i..j),F(size l w S i Z e-i+j..j)) 
enddef 

def EnsemblelnplaceFloatingPoint(op,size t rd,rc,rb) as 
d <- RegRead(rd, 128) 
c RegRead(rc f 128) 
b <- RegRead(rb, 128) 
for i <- 0 to 128-size by size 

di<-F(prec,di +P rec-1.j) 
case op of 

E.MULADD.F: 

ai <- fadd(di, mul(prec,c f i,b,i)) 
E.MULADD.C.F: 

if (i and prec) then 

ai <- fadd(di, faddfmuKprec.c^b.i-prec), mul(c,i-prec,b,i))) 

else 

ai <- fadd(di, fsub(mul(prec,c t i,b,i) f mul(prec,c,i+prec,b,i+prec))) 

endif 
E.MUL.SUB.F: 

ai <- frsub(di, mul(prec,c,i,b,i)) 
E.MULSUB.C.F: 

if (i and prec) then 

ai <- frsub(di f faddfmuKpreccj.b.i-prec), mul(c f i-prec,b,i))) 

else 

ai <- frsub(di, fsubfmuKprecci.b.i), muKprec.cj+prec.b.i+prec))) 

endif 

endcase 

ai+prec-1..i «- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 

Fig. 38F 



Operation codes 



E.SCALADD.F.16 


Ensemble scale add floating-point half 


E.SCAL.ADD.F.32 


Ensemble scale add floating-point single 


E.SCAL.ADD.F.64 


Ensemble scale add floating-point double 



Fig. 38G 



Selection 



class 


op 


prec 


scale add 


E.SCAL.ADD.F 


16 32 64 



Format 



E.SCALADD.F.size ra=rd,rc,rb 
ra=escaladdfsize(rd,rc t rb) 

31 24 23 18 17 12 11 65 

I op I rd | re | rb | ra 

8 6 6 6 6 



Fig. 38H 



Definition 

def EnsembleFloatingPointTernaryfop.prec.rd.rc.rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc t 128) 
b <- RegRead(rb, 128) 
for i <- 0 to 128-prec by prec 

di<-F(prec,dj +pr ec-1..i) 

ci<-F(prec t Ci + p re c-i..i) 

ai <- fadd(fmul(di ( F(prec,bp re c-i..o)). fmul(ci, F(prec,b2* pr ec-1..prec))) 
ai+prec-U «- PackF(prec f ai, none) 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 



Fig. 38I 



E.SUB.F.16 


Ensemble subtract floating-point half 


E.SUB.F.16.C 


Ensemble subtract floating-point half ceiling 


E.SUB.F.16.F 


Ensemble subtract floating-point half floor 


E.SUB.F.16.N 


Ensemble subtract floating-point half nearest 


E.SUB.F.16.Z 


Ensemble subtract floating-point half zero 


E.SUB.F.16.X 


Ensemble subtract floating-point half exact 


E.SUB.F.32 


Ensemble subtract floating-point single 


E.SUB.F.32.C 


Ensemble subtract floating-point single ceiling 


E.SUB.F.32.F 


Ensemble subtract floating-point single floor 


E.SUB.F.32.N 


Ensemble subtract floating-point single nearest 


E.SUB.F.32.Z 


Ensemble subtract floating-point single zero 


E.SUB.F.32.X 


Ensemble subtract floating-point single exact 


E.SUB.F.64 


Ensemble subtract floating-point double 


E.SUB.F.64.C 


Ensemble subtract floating-point double ceiling 


E.SUB.F.64.F 


Ensemble subtract floating-point double floor 


E.SUB.F.64.N 


Ensemble subtract floating-point double nearest 


E.SUB.F.64.Z 


Ensemble subtract floating-point double zero 


E.SUB.F.64.X 


Ensemble subtract floating-point double exact 


E.SUB.F.128 


Ensemble subtract floating-point quad 


E.SUB.F.128.C 


Ensemble subtract floating-point quad ceiling 


E.SUB.F.128.F 


Ensemble subtract floating-point quad floor 


E.SUB.F.128.N 


Ensemble subtract floating-point quad nearest 


E.SUB.F.128.Z 


Ensemble subtract floating-point quad zero 


E.SUB.F.128.X 


Ensemble subtract floating-point quad exact 



Fig. 39A 



S lection 



class 


op 


prec 


round/trap 


set 


SET. 

E LG 
L GE 


16 32 64 128 


NONE X 


subtract 


SUB 


16 32 64 128 


NONE C F N X Z 



Format 



E.op.prec.rouhd rd=rb,rc 
rd=eopprecround(rb,rc) 

31 24 23 18 17 12 11 6 5 0 

I E.prec | rd | rc I rb | op. round | 

8 6 6 6 6 



Fig. 39B 



Definition 



def EnsembleReversedFloatingPoint(op,prec f round t rd t rc t rb) 
c<- RegRead(rc, 128) 
b<- RegRead(rb, 128) 
for i 4- 0 to 128-prec by prec 

ci«-F(prec,Cj +pre c-1..i) 

bi «- F(prec,bj+p re c-1j) 

ai <- frsubr(ci,-bi, round) 

ai+prec-1..i <- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 39C 



Operation codes 



G.SET.E.F.16 


oroup set equal Tioating-poini nan 


G.SET.E.F.16.X 


Group set equal floating-point half exact 


G.SET.E.F.32 


Group set equal floating-point single 


G.SET.E.F.32.X 


Group set equal floating-point single exact 


G.SET.E.F.64 


Group set equal floating-point double 


G.SET.E.F.64.X 


A^\ A 1 #1 *• • ■ J A ft A 

Group set equal floating-point double exact 


G.SET.E.F.128 


Group set equal floating-point quad 


G.SET.E.F.128.X 


Group set equal floating-point quad exact 


G.SET.GE.F.16.X 


Group set greater equal floating-point half exact 


G.SET.GE.F.32.X 


Group set greater equal floating-point single exact 


G.SET.GE.F.64.X 


Group set greater equal floating-point double exact 


^^X ^X «w p* ^ ^x «x x f 

G.SET.GE.F.128.X 


Group set greater equal floating-point quad exact 


G.SET.LG.F.16 


Group set less greater floating-point half 


^"X ^X | j«x M ^ ^x X t 

G.SET.LG.F.16.X 


Group set less greater floating-point half exact 


^^X 4*H I ^» 4X^X 

G.SET.LG.F.32 


Group set less greater floating-point single 


G.SET.LG.F.32.X 


Group set less greater floating-point single exact 


G.SET.LG.F.64 


Group set less greater floating-point double 


G.SET.LG.F.64.X 


Group set less greater floating-point double exact 


G.SET.LG.F.128 


Group set less greater floating-point quad 


G.SET.LG.F.128.X 


Group set less greater floating-point quad exact 


A^^ A 9 ^ P* | M * 

G.SET.L.F.16 


Group set less floating-point half 


G.SET.L.F.16.X 


Group set less floating-point half exact | 


^^X **X 1 *X J»X 

G.SET.L.F.32 


Group set less floating-point single 


G.SET.LF.32.X 


Group set less floating-point single exact 


CX QCT 1 P C>1 
o.oc 1 .L.r.DH 


(~1 rr\ 1 1 rx cot lace f!r%oti nn_nr\Int r\r\i iKIa 

oroup stfi less iioaung-poini oouDie 


G.SET.LF.64.X 


Group set less floating-point double exact 


G.SET.LF.128 


Group set less floating-point quad 


G.SET.LF.128.X 


Group set less floating-point quad exact 


G.SET.GE.F.16 


Group set greater equal floating-point half 


G.SET.GE.F.32 


Group set greater equal floating-point single 


G.SET.GE.F.64 


Group set greater equal floating-point double 


G.SET.GE.F.128 


Group set greater equal floating-point quad 



Fig. 39D 



Equivalencies 



/-\ c»ct i r r a c V 

G.Sc T Lc.r. T O.X 


^rni in cot lace o/iiiol flr»otinn_nrMnt half ovart 
OlUUp bul Icoo CljUal lIUdUny-pUM H flail CAdUl 


OCT ICC QO V 


f^rnim cpt I pee pniial flnatinn-nnint cinnlp pyart 


OCT ICC A A V 


r^rniin cpt Ipcc pniial flnatinrvnoint Hnuhlp PYact 


OCT ICC 4 oo V 

b.ot / .Lt.r. 7 ^o.X 


f^roitn cpt Ipcc pniial flnatinn-nnint miaH PYaf*t 


/"> OCT /"^ C «f 


f^rniin cpt nrpsfpr flnatinn-nnint half 
Oiuup oci yiwaici uuaui ly-pvii u nail 


oct c v 


f5rm in cpt nrpatpr flnatinn-nnint half PYact 
vjiuup owi yicaici iiuaui ly pun ii nan CAaui 


/""* OCT c oo 

G.SET.G.r.32 


oruup oci yicaitjr iiQduiiy-puini bif lyie 


OCT C OO V 

G.SET.G.F.32.X 


oroup sei greater Tioaung-poini single exact 


G.SET.G.F.64 


vj»roup sei greater Tioaung-poini oouDie 


G.SET.G.F.64.X 


oroup sei greaier noaung-puini aouuie exaci 


U.OCf .w.r . / i£0 


GrouD set areater floatina-Doint auad 


G.SET.G.F. 128.X 


Group set greater floating-point quad exact 


G.SET.LE.F.16 


Group set less equal floating-point half 


G.SET.LE.F.32 


Group set less equal floating-point single 


G.SET.LE.F.64 


Group set less equal floating-point double 


G.SET.LE.F.128 


Group set less equal floating-point quad 



G.SET.G.F.prec rd=rb,rc 


-> 


G.SET.LF.prec rd=rc f rb 


G. SET. G.F.precX rd=rb,rc 




G.SET.LF.prec.X rd=rc f rb 


G.SET.LE.F.prec rd=rb,rc 


-> 


G.SET.GE.F.prec rd=rc,rb } 


G.SET.LE.F.precX rd=rb,rc 


-> 


G.SET.GE.F.prec.X rd=rc,rb 



Fig. 39E 



Selection 



class 


op 


prec 


round/trap 


set 


SET. 
E LG 
L GE 
G LE 


16 32 64 128 


NONE X 



Format 



G.op.prec.round rd=rb,rc 
rc-gopprecround(rb.ra) 

31 24 23 18 17 12 11 65 0 

| G.prec | rd | rc | rb | op.round j 

8 6 6 6 6 



Fig 39F 



Definition 



def GroupFloatingPointReversedfop.prec/ound.rd.rc.rb) as 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i ^ 0 to 128-prec by prec 
ci^F(prec,Ci +P rec-1..i) 
bi4-F(prec > bj + p r ec.1..i) 
if round*NONE then 

if (di.t = SNAN) or (cLt = SNAN) then 
raise FloatingPointArithmetic 

endif 

case op of 

G.SET.LF, G.SET.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.SET.LF: 

ai «- bi?£ci 
G.SET.GE.F: 

ai <- bi!?<ci 
G.SET.E.F: 
ai <- bi=ci 
. G.SET.LG.F: 
ai <- bi#ci 

endcase 

ai+prec-1..i<-ai prec 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Floating-point arithmetic 

Fig. 39G 



G.C0M.E.F.16 


Group compare equal floating-point half 


G.C0M.E.F.16.X 


Group compare equal floating-point half exact 


G.COM.E.F.32 


Group compare equal floating-point single 


G.COM.E.F.32.X 


Group compare equal floating-point single exact 


G.COM.E.F.64 


Group compare equal floating-point double 


G.COM.E.F.64.X 


Group compare equal floating-point double exact 


G.COM.E.F.128 


Group compare equal floating-point quad 


G.COM.E.F.128.X 


Group compare equal floating-point quad exact 


G.C0M.GE.F.16 


Group compare greater or equal floating-point half 


G.C0M.GE.F.16.X 


Group compare greater or equal floating-point half exact 


G.COM.GE.F.32 


Group compare greater or equal floating-point single 


G.COM.GE.F.32.X 


Group compare greater or equal floating-point single exact 


G.COM.GE.F.64 


Group compare greater or equal floating-point double 


G.COM.GE.F.64.X 


Group compare greater or equal floating-point double exact 


G.COM.GE.F.128 


Group compare greater or equal floating-point quad 


G.COM.GE.F.128.X 


Group compare greater or equal floating-point quad exact 


G.C0M.LF.16 


Group compare less floating-point half 


G.C0M.LF.16.X 


Group compare less floating-point half exact 


G.COM.LF.32 


Group compare less floating-point single 


G.COM.L.F.32.X 


Group compare less floating-point single exact 


G.COM.LF.64 


Group compare less floating-point double 


G.COM.LF.64.X 


Group compare less floating-point double exact 


G.COM.LF.128 


Group compare less floating-point quad 


G.COM.LF. 128.X 


Group compare less floating-point quad exact 


G.COM.LG.F.16 


Group compare less or greater floating-point half 


G.COM.LG.F.16.X 


Group compare less or greater floating-point half exact 


G.COM.LG.F.32 


Group compare less or greater floating-point single 


G.COM.LG.F.32.X 


Group compare less or greater floating-point single exact 


G.COM.LG.F.64 


Group compare less or greater floating-point double 


G.COM.LG.F.64.X 


Group compare less or greater floating-point double exact 


G.COM.LG.F.128 


Group compare less or greater floating-point quad 


G.COM.LG.F.128.X 


Group compare less or greater floating-point quad exact j 



Fig. 40A 



Format 



G.COM.op.prec.round rd.rc 
rc=gcomopprecround(rd,rc) 

31 24 23 18 17 12 11 6 5 0 

I G.prec | rd I rc | op | GCOM 1 

8 6 6 6 6 



Fig. 40B 



Definition 

def GroupCompareFloatingPointfop.prec.round.rd.rc) as 
d <- RegRead(rd. 128) 
c <- RegRead(rc, 128) 
for i <- 0 to 128-prec by prec 
di<-F(prec,dj +P rec-1..i) 
cif-FCprec.q+prec-l.j) 
if round*NONE then 

if (di.t = SNAN) or (ci.t = SNAN) then 
raise FloatingPointArithmetic 

end if 

case op of 

G.COM.LF, G.COM.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.COM.LF: 

ai <r- di?£ci 
G.COM.GE.F: 

ai <- di!?<ci 
G.COM.E.F: 

ai <r- di=ci 
G.COM.LG.F: 

ai 4- di*ci 

endcase 

ai+prec-1..i<-ai 
endfor 

if (a * 0) then 

raise FloatingPointArithmetic 

endif 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 40C 



E.ABS.F.16 


Ensemble absolute value floating-point half 


E.ABS.F.16.X 


Ensemble absolute value floating-point half exception 


E.ABS.F.32 


Ensemble absolute value floating-point single 


E.ABS.F.32.X 


Ensemble absolute value floating-point single exception 


E.ABS.F.64 


Ensemble absolute value floating-point double 


E.ABS.F.64.X 


Ensemble absolute value floating-point double exception 


E.ABS.F.128 


Ensemble absolute value floating-point quad 


E.ABS.F. 128.X 


Ensemble absolute value floating-point quad exception 


E.C0PY.F.16 


Ensemble copy floating-point half 


E.C0PY.F.16.X 


Ensemble copy floating-point half exception 


E.COPY.F.32 


Ensemble copy floating-point single 


E.COPY.F.32.X 


Ensemble copy floating-point single exception 


E.COPY.F.64 


Ensemble copy floating-point double 


E.COPY.F.64.X 


Ensemble copy floating-point double exception 


E.COPY.F.128 


Ensemble copy floating-point quad 


E.COPY.F. 128.X 


Ensemble copy floating-point quad exception 


E.DEFLATE.F.32 


Ensemble convert floating-point half from single 


E.DEFLATE.F.32.C 


Ensemble convert floating-point half from single ceiling 


E.DEFLATE.F.32.F 


Ensemble convert floating-point half from single floor 


E.DEFLATE.F.32.N 


Ensemble convert floating-point half from single nearest 


E.DEFLATE.F.32.X 


Ensemble convert floating-point half from single exact 


E.DEFLATE.F.32.Z 


Ensemble convert floating-point half from single zero 


E.DEFLATE.F.64 


Ensemble convert floating-point single from double 


E.DEFLATE.F.64.C 


Ensemble convert floating-point single from double ceiling 


E.DEFLATE.F.64.F 


Ensemble convert floating-point single from double floor 


E.DEFLATE.F.64.N 


Ensemble convert floating-point single from double nearest 


E.DEFLATE.F.64.X 


Ensemble convert floating-point single from double exact 


E.DEFLATE.F.64.Z 


Ensemble convert floating-point single from double zero 


E.DEFLATE.F.128 


Ensemble convert floating-point double from quad 


E.DEFLATE.F.128.C 


Ensemble convert floating-point double from quad ceiling 


E.DEFLATE.F.128.F 


Ensemble convert floating-point double from quad floor 


E.DEFLATE.F.128.N 


Ensemble convert floating-point double from quad nearest 


E.DEFLATE.F. 128.X 


Ensemble convert floating-point double from quad exact 


E.DEFLATE.F. 1 28.Z 


Ensemble convert floating-point double from quad zero 


E.FLOAT.F.16 


Ensemble convert floating-point half from doublets 


E.FLOAT.F.16.C 


Ensemble convert floating-point half from doublets ceiling 


E.FLOAT.F.16.F 


Ensemble convert floating-point half frc~i doublets floor 


E.FLOAT.F.16.N 


Ensemble convert floating-point half from doublets nearest 


E.FLOAT.F.16.X 


Ensemble convert floating-point half from doublets exact 


E.FLOAT.F.16.Z 


Ensemble convert floating-point half from doublets zero 



Fig.41A 



E FLOAT F 32 

W— • 1 mm* \m* 1 \ 1 .1 • Wb 


Ensemble convert floating-point single from quadlets 


E FLOAT F 32 C 


Ensemble convert floating-point single from quadlets ceiling 


E FLOAT F 32 F 


Ensemble convert floating-point single from quadlets floor 


E FLOAT F 32 N 


Ensemble convert floating-point single from quadlets nearest 


E.FLOAT.F.32.X 


Ensemble convert floating-point single from quadlets exact 


E.FLOAT.F.32 Z 


Ensemble convert floating-point single from quadlets zero 


E FLOAT F 64 


Ensemble convert floating-point double from octlets 


E FLOAT F 64 C 


Ensemble convert floating-point double from octlets ceiling 


E FLOAT F 64 F 


Ensemble convert floating-point double from octlets floor 


E FLOAT F 64 N 


Ensemble convert floating-point double from octlets nearest 


E FLOAT F 64 X 


Ensemble convert floating-point double from octlets exact 


E FLOAT F 64 Z 


Ensemble convert floating-point double from octlets zero 


E FLOAT F 128 


Ensemble convert floating-point quad from hexlet 


E FLOAT F 128 C 


Ensemble convert floating-point quad from hexlet ceiling 


E FLOAT F 128 F 


Ensemble convert floating-point quad from hexlet floor 


E FLOAT F 128 N 


Ensemble convert floating-point quad from hexlet nearest 


E FLOAT F 128 X 


Ensemble convert floating-point quad from hexlet exact 


E FLOAT F 128 7 


Ensemble convert floating-point quad from hexlet zero 


E INFLATE F 16 


Ensemble convert floating-point single from half 


E INFLATE F 16 X 


Ensemble convert floating-point single from half exception 


E INFLATE F 32 


Ensemble convert floating-point double from single 


E INFLATE F 32 X 


Ensemble convert floating-point double from single exception j 


E INFLATE F 64 


Ensemble convert floating-point quad from double 


E INFLATE F 64 X 


Ensemble convert floating-point quad from double exception 


E NEG F 16 

1mm, ,11 L. \mj . 1 * | \J 


Ensemble negate floating-point half 


E NEG F 16 X 


Ensemble negate floating-point half exception 


E NEG F 32 


Ensemble negate floating-point single 


E NEG F 32 X 


Ensemble negate floating-point single exception 


E NEG F 64 

l— • 1 * L. \mJ • 1 • \m*~ 


Ensemble negate floating-point double 


E NEG F 64 X 


Ensemble negate floating-point double exception 


E NEG F 128 


Ensemble negate floating-point quad 


E NEG F 128 X 


Ensemble negate floating-point quad exception 


E RECEST F 16 

UilAUVUU I.I. 1 \J 


Ensemble reciprocal estimate floating-point half 


E RECEST F 16 X 

L.IM.VLW I.I • IU.A 


Ensemble reciprocal estimate floating-point half exception 


E RECEST F 32 

• 1 \ ^mS mmm. \mJ 1 . | m \mt ^ 


Ensemble reciprocal estimate floating-point single 


E.RECEST.F.32.X 


Ensemble reciprocal estimate floating-point single exception 


E.RECEST.F.64 


Ensemble reciprocal estimate floating-point double 


E.RECEST.F.64.X 


Ensemble reciprocal estimate floating-point double exception 


E.RECEST.F.128 


Ensemble reciprocal estimate floating-point quad 


E.RECEST.F. 128.X 


Ensemble reciprocal estimate floating-point quad exception 



Fig. 41A (cont'd) 



E.RSQREST.F.16 


Ensemble floating-point reciprocal square root estimate half j 


E.RSQREST.F.16.X 


Ensemble floating-point reciprocal square root estimate half exact 


E.RSQREST.F.32 


Ensemble floating-point reciprocal square root estimate single 


E.RSQREST.F.32.X 


Ensemble floating-point reciprocal square root estimate single exact 


E.RSQREST.F.64 


Ensemble floating-point reciprocal square root estimate double 


E.RSQREST.F.64.X 


Ensemble floating-point reciprocal square root estimate double exact 


E.RSQREST.F.128 


Ensemble floating-point reciprocal square root estimate quad 


E.RSQREST.F.128.X 


Ensemble floating-point reciprocal square root estimate quad exact 


E.SINK.F.16 


Ensemble convert floating-point doublets from half nearest default 


E.SINK.F.16.C 


Ensemble convert floating-point doublets from half ceiling 


E.SINK.F.16.C.D 


Ensemble convert floating-point doublets from half ceiling default 


E.SINK.F.16.F 


Ensemble convert floating-point doublets from half floor 


E.SINK.F.16.F.D 


Ensemble convert floating-point doublets from half floor default 


E.SINK.F.16.N 


Ensemble convert floating-point doublets from half nearest 


E.SINK.F.16.X 


Ensemble convert floating-point doublets from half exact 


E.SINK.F.16.Z 


Ensemble convert floating-point doublets from half zero 


E.SINK.F.16.Z.D 


Ensemble convert floating-point doublets from half zero default 


E.SINK.F.32 


Ensemble convert floating-point quadlets from single nearest default 


E.SINK.F 32 C 


Ensemble convert floating-point quadlets from single ceiling 


E.SINK.F.32 C D 


Ensemble convert floating-point quadlets from single ceiling default 


E.SINK.F.32.F 


Ensemble convert floating-point quadlets from single floor 


E.SINK.F.32.F.D 


Ensemble convert floating-point quadlets from single floor default 


E.SINK.F.32.N 


Ensemble convert floating-point quadlets from single nearest 


E.SINK.F.32.X 


Ensemble convert ftoating-pQint quadlets from single exact 


E.SINK.F.32.Z 


Ensemble convert floating-point quadlets from single zero 


E.SINK.F.32.Z.D 


Ensemble convert floating-point quadlets from single zero default j 


E.SINK.F.64 


Ensemble convert floating-point octlets from double nearest default 


E.SINK.F.64.C 


Ensemble convert floating-point octlets from double ceiling 


E.SINK.F.64.C.D 


Ensemble convert floating-point octlets from double ceiling default 


E.SINK.F.64.F 


Ensemble convert floating-point octlets from double floor J 


E.SINK.F.64.F.D 


Ensemble convert floating-point octlets from double floor default 


E.SINK.F.64.N 


Ensemble convert floating-point octlets from double nearest 


E.SINK.F.64.X 


Ensemble convert floating-point octlets from double exact 


E.SINK.F.64.Z 


Ensemble convert floating-point octlets from double zero 


E.SINK.F.64.Z.D 


Ensemble convert floating-point octlets from double zero default 


E.SINK.F.128 


Ensemble convert floating-point hexlet from quad nearest default 


E.SINK.F.128.C 


Ensemble convert floating-point hexlet from quad ceiling 


E.SINK.F.128.C.D 


Ensemble convert floating-point hexlet from quad ceiling default j 


E.SINK.F.128.F 


Ensemble convert floating-point hexlet from quad floor 


E.SINK.F.128.F.D 


Ensemble convert floating-point hexlet from quad floor default 



Fig. 41A (cont'd) 



E.SINK.F.128.N 


Ensemble convert floating-point hexlet from quad nearest 


E.SINK.F.128.X 


Ensemble convert floating-point hexlet from quad exact 


E.SINK.F.128.Z 


Ensemble convert floating-point hexlet from quad zero 


E.SINK.F.128.Z.D 


Ensemble convert floating-point hexlet from quad zero default 


E.SQR.F.16 


Ensemble square root floating-point half 


E.SQR.F.16.C 


Ensemble square root floating-point half ceiling 


E.SQR.F.16.F 


Ensemble square root floating-point half floor 


E.SQR.F.16.N 


Ensemble square root floating-point half nearest 


E.SQR.F.16.X 


Ensemble square root floating-point half exact 


E.SQR.F.16.Z 


Ensemble square root floating-point half zero 


E.SQR.F.32 


Ensemble square root floating-point single 


E.SQR.F.32.C 


Ensemble square root floating-point single ceiling 


E.SQR.F.32.F 


Ensemble square root floating-point single floor 


E.SQR.F.32.N 


Ensemble square root floating-point single nearest 


E.SQR.F.32.X 


Ensemble square root floating-point single exact i 


E.SQR.F.32.Z 


Ensemble square root floating-point single zero 


E.SQR.F.64 


Ensemble square root floating-point double 


E.SQR.F.64.C 


Ensemble square root floating-point double ceiling 


E.SQR.F.64.F 


Ensemble square root floating-point double floor 


E.SQR.F.64.N 


Ensemble square root floating-point double nearest 


E.SQR.F.64.X 


Ensemble square root floating-point double exact 


E.SQR.F.64.Z 


Ensemble square root floating-point double zero 


E.SQR.F.128 


Ensemble square root floating-point quad 


E.SQR.F.128.C 


Ensemble square root floating-point quad ceiling 


E.SQR.F.128.F 


Ensemble square root floating-point quad floor 


E.SQR.F.128.N 


Ensemble square root floating-point quad nearest 


E.SQR.F.128.X 


Ensemble square root floating-point quad exact 


E.SQR.F.128.Z 


Ensemble square root floating-point quad zero 


E.SUM.F.16 


Ensemble sum floating-point half 


E.SUM.F.16.C 


Ensemble sum floating-point half ceiling 


E.SUM.F.16.F 


Ensemble sum floating-point half floor 


E.SUM.F.16.N 


Ensemble sum floating-point half nearest 


E.SUM.F.16.X 


Ensemble sum floating-point half exact 


E.SUM.F.16.Z 


Ensemble sum floating-point half zero 


E.SUM.F.32 


Ensemble sum floating-point single 


E.SUM.F.32.C 


Ensemble sum floating-point single ceiling 


E.SUM.F.32.F 


Ensemble sum floating-point single floor 


E.SUM..-32.N 


Ensemble sum floating-point single nearest 


E.SUM.F.32.X 


Ensemble sum floating-point single exact 


E.SUM.F.32.Z 


Ensemble sum floating-point single zero 



Fig. 41 A (cont'd) 



E.SUM.F.64 


Ensemble sum floating-point double 


E.SUM.F.64.C 


Ensemble sum floating-point double ceiling 


E.SUM.F.64.F 


Ensemble sum floating-point double floor 


E.SUM.F.64.N 


Ensemble sum floating-point double nearest 


E.SUM.F.64.X 


Ensemble sum floating-point double exact 


E.SUM.F.64.Z 


Ensemble sum floating-point double zero 


E.SUM.F.128 


Ensemble sum floating-point quad 


E.SUM.F.128.C 


Ensemble sum floating-point quad ceiling 


E.SUM.F.128.F 


Ensemble sum floating-point quad floor 


E.SUM.F.128.N 


Ensemble sum floating-point quad nearest 


E.SUM.F.128.X 


Ensemble sum floating-point quad exact 


E.SUM.F.128.Z 


Ensemble sum floating-point quad zero 



Selection 





op 


prec 


round/trap 


copy 


COPY 


16 32 64 128 


NONE X 


absolute 
value 


ABS 


16 32 64 128 


NONE X 


float from 
integer 


FLOAT 


16 32 64 128 


NONE C F N X Z 


integer 
from float 


SINK 


16 32 64 128 


NONE C F N X Z 
CD F.D Z.D 


increase 

format 

precision 


INFLATE 


16 32 64 


noneX 


decrease 

format 

precision 


DEFLATE 


32 64 128 


noneCFNXZ. 


negate 


NEG 


16 32 64 128 


noneX 


reciprocal 
estimate 


RECEST 


16 32 64 128 


noneX 


reciprocal 
square root 
estimate 


RSQREST 


16 32 64 128 


noneX 


square root 


SQR 


16 32 64 128 


none CFNXZ ! 


sum 


SUM 


16 32 64 128 


NONE C F N X Z 



Fig. 41 A (cont'd) 



Format 

r 

E.op.prec.round rd=rc 
rd=eopprecround(rc) 

31 24 23 18 17 , 12 11 65 0 

I E.prec | rd | rc | op | E.UNARY I 

8 6 6 6 6 



Fig. 41 B 



Definition 

def EnsembleUnaryFloatingPoint(op,pr c,round,rd,rc) as 
c <- RegRead(rc, 128) 
case op of 

E.ABS.F, E.NEG.F, E.SQR.F: 
for i 0 to 128-prec by prec 
cii-Ffprec.q+prec-lj) 
case op of 
E.ABS.F: 

ai.t <- ci.t 
ai.s 4- 0 
ai.e <- ci.e 
ai.f «- ci.f 
E.COPY.F: 
ai«-ci 
E.NEG.F: 

ai.t <- ci.t 
ai.s +~ -ci.s 
ai.e <- ci.e 
ai.f <- ci.f 
E.RECEST.F: 

ai *- frecest(ci) 
E.RSQREST.F: 

ai <r- frsqrest(ci) 
E.SQR.F: 

ai <- fsqr(ci) 

endcase 

ai+prec-1..i «- PackF(prec, ai, round) 
endfor 
E.SUM.F: 

p[0].t <- NULL 

for i ^- 0 to 1 28-prec by prec 

p[i+prec] <- fadd(p[i] f F(prec,Cj +pr ec-lj)) 
endfor 

a <- PackF(prec, p[128] t round) 
E.SINK.F: 

for i <- 0 to 128-prec by prec 

ci4-F(prec,q + prec.l..i) 

ai+prec-1..i <- fsinkr(prec, ci, round) 
endfor 
E.FLOAT.F: 

for i 4- 0 to 128-prec by prec 

ci.t <- NORM 

ci.e *- 0 

ci.s <- q+prec-1 

ci.f <- ci.s ? 1+~Cj +P rec-2..i : Ci+prec-2..i 
ai+prec-1 ..i «- PackF(prec, ci, round) 
endfor 



Fig. 41C 



E.INFLATE.F: 

for i 0 to 64-prec by prec 
ci«-F(pr c.Cj+prec-L.i) 

ai+i+prec+prec-1..i+i <- PackF(prec+prec, ci, round) 
endfor 
E.DEFLATE.F: 

for i 4- 0 to 128-prec by prec 

ci F(prec f Cj+ prec .ij) 

ai/2+prec/2-1..i/2 «- PackF(prec/2, ci, round) 
endfor 
3127..64 «- 0 

endcase 

RegWrite[rd, 128, a] 
enddef 

Exceptions 

Floating-point arithmetic 



Fig. 41C (cont'd) 



E.MUL.G.8 


Ensemble multiply Galois field byte 


E.MUL.G.64 


Ensemble multiply Galois field octlet 



Fig. 42A 



Format 

E.MUL.G.size ra=rd,rc,rb 
ra=emulgsize(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

|~E~MUL.G.size | rd | rc I rb | ra | 

8 6 6 6 6 



Fig.42B 



Definition 

def c <- PolyMultiply(size,a,b) as 

p[0] 4- 0 2 * size 

for k <- 0 to size-1 

p[k+1] <- p[k] A a k ? (0 size ~ k || b || 0 k ) : O 2 ^ 

endfor 

c +- p[size] 
enddef 

def c <- PolyResidue(size,a,b) as 
p[0] <- a 

for k <- size-1 to 0 by -1 

p[k+1] +- p[k] * p[0] si2 e + k ? (0 size - k I1 1 1 II b || 0 k ) : O^size 
endfor 

c«-p[size] S j ze -i..o 
enddef 

def EnsembleTemaryfop.size.rd.rc.rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 

E.MULG: 

for i <- 0 to 1 28-size by size 

a S ize-1 H j «- PolyResiduefsizePolyMuKsize.Csfce-i +j. .i.bsize-1 +i. .j),d S ize-1+Li) 
endfor 

endcase 

RegWrite(ra, 128, a) 
enddef 



Exceptions 

none 



Fig. 42C 



2047 



rc(1 28) 




i ffreg S9 OI3 S3 



i3 fc£J SS^ ESS 



128 



ra(128) o 
Ensemble multiply Galois field bytes 
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A.v<JIVinr\coo.Z 




A. VyV-/IVI r r\ C OO .H 


Oro^^har rnmnrp^Q cinnoH niHHIoc 

VI V99UOI wl 1 l^Ji 6g9 9IWI IC\J IHUUICO 


Y PHMPRPQQ A 
A . V-/ \J ivi n r\ c o o . o 


viudduai wUi I i^ji cod ol^HCU uyit?5> 


A.U V/M" rvCoo. 1 0 


f^rnQ^har mmnrocc cinnoH HmiHIotc 


y phmdrpcq 
A.OUIVlrrvcoo.o*: 


Hrncchflr romnrace cinnaH mioHlatc 

viudduai wunipruoo signsu quauieis 


Y PHMDDCCC GA 


u rosso a r cumpress signea ocuets 


A.UUIVIrKtoo.1^0 


urusbDar compress signea nexiet 


Y PHKilDDCOC 1 1 O 

A.UUMrKboo.U.^ 


urossDar compress unsigneo pecKs 


Y PriMDDCOC I I a 

A.UUIvlrKtoo.U.4 


urossDar compress unsigneo niDDies 


A.UUMrKboo.U.o 


urossDar compress unsigneo Dytes 


A.LUIvlrKboo.U.ib 


urossoar compress unsigneo doublets 


V PHMDDCCO 1 1 OO 


urossoar compress unsigneo quadlets 


v rnK^iDDcoo 1 1 ga 


urossDar compress unsigneo octlets 


A.UUMrKcoo.U.uo 


urossDar compress unsigneo nexiet 


V CYDAMn O 

A.bArANU./ 


orossDar expand signed pecks 


A.bArANU.4 


Crossbar expand signed nibbles i 


Y CYDAMH D 

A.bArANU.o 


urossoar expand signed bytes 


Y CYDAMH 4C 

A.bArAiNU. ID 


urossDar expand signed doublets 


Y CYDAMH OO 

A.bArANU.32 


Crossbar expand signed quadlets 


Y CYDAMH GA 

a . b Ar AIM U . 54 


urossDar expand signed octlets 


Y CVDAKIH 4 OO 

A. bAr AND. 1 28 


Crossbar expand signed hexlet 


Y CVDAKIH 1 1 O 

A.bArANU.U.2 


Crossbar expand unsigned pecks 


V CVDAKIH 1 1 A 

A.bArANU.U.4 


Crossbar expand unsigned nibbles 


Y CYDAMH 1 1 Q 
A.cArAINU.U.O 


urossoar expano unsigneo Dytes 


Y PYPAMn 1 1 1£ 
A.CArvMNU.U.lO 


Vsiuoouar expanu unsigneo oouDieis 


A.uArnlNU.U.Ot 


Oro^^Kpr <*Ynanrl nnctnnoH niiorllote 


X EXPAND I J 84 


Crossbar exoand tin^innprl nrtlotc 


X EXPAND U 128 


Crossbar expand unsianed hexlet 


X.R0TL.2 


Crossbar rotatp Ipft nprkc 


X ROTL 4 


Cros^har rntatA Ipft nihhloc 1 


X ROTL 8 


Cro^^hpr rotate loff h\/toc 


X ROTL 16 


Crosshar rotate laft Hm ihlotc 


X ROTL 32 


Crossbar rotatp Ipff nt tarllotc 


X.ROTL.64 


Crossbar rotate left octlets 


X. ROTL. 128 


Crossbar rotate left hexlet 


X.R0TR.2 


Crossbar rotate right pecks 


X.R0TR.4 


Crossbar rotate right nibbles 


X.R0TR.8 


Crossbar rotate right bytes 


X.R0TR.16 


Crossbar rotate right doublets 



Fig. 43 A 



X.ROTR.32 


Crossbar rotate right quadlets 


X.ROTR.64 


Crossbar rotate right octlets 


X.ROTR.128 


Crossbar rotate right hexlet 


X.SHL.2 


Crossbar shift left pecks 


X.SHL2.0 


Crossbar shift left signed pecks check overflow 


X.SHL.4 


Crossbar shift left nibbles 


X.SHL.4.0 


Crossbar shift left signed nibbles check overflow 


X.SHL.8 


Crossbar shift left bytes 


X.SHL.8.0 


Crossbar shift left signed bytes check overflow 


X.SHL16 


Crossbar shift left doublets 


X.SHL16.0 


Crossbar shift left signed doublets check overflow 


X.SHL32 


Crossbar shift left quadlets 


X.SHL.32.0 


Crossbar shift left signed quadlets check overflow 


X.SHL64 


Crossbar shift left octlets 


X.SHL.64.0 


Crossbar shift left sianed octlets check overflow 


X.SHL128 


Crossbar shift left hexlet 


X.SHL128.0 


Crossbar shift left signed hexlet check overflow 


X.SHLU.2.0 


Crossbar shift left unsiqned pecks check overflow 


X.SHL.U.4.0 


Crossbar shift left unsigned nibbles check overflow 


X.SHLU.8.0 


Crossbar shift left unsigned bytes check overflow 


X.SHL.U.16.0 


Crossbar shift left unsigned doublets check overflow 


X.SHL.U.32.0 


Crossbar shift left unsiqned auadlets check overflow 


X.SHL.U.64.0 


Crossbar shift left unsianed octlets check overflow 


X.SHLU.128.0 


Crossbar shift left unsigned hexlet check overflow 


X.SHR.2 


Crossbar signed shift right pecks 


X.SHR.4 


Crossbar signed shift right nibbles 


X.SHR.8 


Crossbar signed shift right bytes 


X.SHR.16 


Crossbar signed shift right doublets 


X.SHR.32 


Crossbar signed shift right quadlets 


X.SHR.64 


Crossbar signed shift right octlets 


X.SHR.128 


Crossbar signed shift right hexlet 


X.SHR.U.2 


Crossbar shift nght unsigned pecks 


X.SHR.U.4 


Crossbar shift right unsigned nibbles 


X.SHR.U.8 


Crossbar shift right unsigned bytes 


X.SHR.U.16 


Crossbar shift right unsigned doublets 


X.SHR.U.32 


Crossbar shift right unsigned quadlets 


X.SHR.U.64 | 


Crossbar shift right unsigned octlets | 


X.SHR.U.128 


Crossbar shift right unsigned hexlet 



Fig. 43A (cont'd) 



Selection 



class 


op 


size 


precision 


EXPAND EXPAND.U 
COMPRESS 

COMPRESS. 

U 


2 4 8 16 32 64 128 


shift 


ROTR ROTL SHR SHL 
SHL.O SHLU.O 
SHR.U 


2 4 8 16 32 64 128 



Format 

X.op.size rd=rc,rb 
rd=xopsize(rc,rb) 

31 252423 18 17 12 11 6 5 21 0 

I XSHIFT |s| rd | re | rb | op |sz] 

7 1 6 6 6 4 2 

Isize <- log(size) 
s <- Isize2 
sz<- lsizei..o 



Fig. 43B 



Definition 



def Crossbar(op,size t rd,rc,rb) 
c<- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
shift b and (size-1) 
case ops.,2 II 0 2 of 
X.COMPRESS: 
hsize <- size/2 

for i <— 0 to 64-hsize by hsize 
if shift £ hsize then 

ai+hsize-1..i <- cw+shift+hsize-1 J+i+shift 

else 

aj+hsize-1 ..i +- cf^!Psce?P II Q+i+size-1 J+i+shift 

endif 
endfor 
ai27..64<-0 
X.COMPRESS.U: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

3i+hsize-1..i «- Ci+i+shift+hsize-1J+i+shift 

else 

ai + hsize-1.J «- O^ift-hsize || Cj +i+S ize-1.J+i+shm 

endif 
endfor 
ai27..64<-0 
X.EXP AND: 

hsize size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

an+size-U+i «- cttfepP || ^ hsiz ^ j || (jshift 

else 

aw+size-1.>i «- Cj + size-shift-1..i || 0* hif * 

endif 
endfor 
X.EXP AND.U: 

hsize <- size/2 

for i 0 to 64-hsize by hsize 
if shift <, hsize then 

aw + size-1..W *- O hslz ^hift || q +h$ize . 1 , || 0* hif * 

else 

aj+i+size-U+i <- c l+sizMhrfrlB j || 0 shift 

endif 
endfor 
X.ROTL: 

for i <- 0 to 128-size by size 

ai+size-1..i <- Ci+size-1-shifU II Cj+ S ize-1..i+size-1-shift 
ndfor 



Fig. 43C 



X.ROTR: 

for i <- 0 to 1 28-siz by size 

ai+size-1 ..i *- Cj+ S hift-1 „i II Ci+size-1 ..i+shift 
endfor 
X.SHL: 

for i <r- 0 to 128-size by siz 

aj+size-1..i «- Cj +S ize-1 -shift. i II 0 shift 
endfor 
X.SHLO: 

for i 0 to 128-size by size 

if c i+S ize-1..i+size-1-shift * cp + h s ^i. shift ^en 
raise FixedPointArithmetic 

endif 

a|+size-1..i «- Cj+size-1-shift..ill 0 shjft 
endfor 
X.SHLU.O: 

for i <- 0 to 128-size by size 

if q+size-1 . J+size-shift * 0 shift then 
raise FixedPointArithmetic 

endif 

aj+size-1 ..i <- Cj+ S jze-i-shift..ill 0 shift 
endfor 
X.SHR: 

for i 4- 0 to 128-size by size 

aj+size-1 .J «- <f+ h s1ze-1 II c i+s»ze-1..»+shHt 
endfor 
X.SHR.U: 

for i 4- 0 to 128-size by size 

ai+size-U <- 0 shJft || q+size-1 J+shHt 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 43C (cont'd) 




Compress 32 bits to 16, with 4-bit right shift 



Fig. 43D 



Operation codes 



Y QUI M O 


orosoDai on in ien merge pecKs 


y qui M d 

A.OnL.IVI.H 


f^rocchsir chiff loft morno niHHIoc 
viuooudi oi i it i ien meiye inuuieo 


Y QUI M ft 

/\. o n l. . i vi . o 


Prr^cchar chrff loft morno h\/foc 
viUdaUdi oi iii i idi iiieiye L/yieo 


Y QUI M 1 R 


Prncchar chift loft morno Hniihlofc 

uiuooudi of in i ien meiye uuuLHeio 


Y QUI km on 
A. o n L . 1 VI . Oc. 


Prncchar chrff loft 'mo mo mtorflotc 

uruooUai oniii ien merge quauieio 


Y ^Hl M R4 
A,OnL.IVI.v/*t 


Prncchar chrff loft morno nr*tlofc 

uruooudi oniri ien merge ucuei& 


Y QUI M lOA 


isrossoar snm ien merge nexiei 


Y QUP K/i O 
A.onrv.lvl.Z 


L/iossDar snnt ngm merge pecKS 


X SHR M 4 


Grosshar ^hHt rinht mpmt* nihhlpo. 

VlvwvUCII OI Jill 1 lyl 11 lllwiy^ IIIL/L/lwO 


X.SHR.M.8 


Crossbar shift right merge bytes 


X.SHR.M.16 


Crossbar shift right merge doublets 


X.SHR.M.32 


Crossbar shift right merge quadlets 


X.SHR.M.64 


Crossbar shift right merge octlets 


X.SHR.M.128 


Crossbar shift right merge hexlet 



Fig. 43E 



Format 



X.op.size rd@rc,rb 
rd=xopsize(rd,rc,rb) 

31 252423 18 17 12 11 6 5 21 0 

I XSHIFT |s| rd | rc I rb | op | sz | 

7 1 6 6 6 4 2 

Isize <- log(size) 
s <- Isize2 
sz*- lsizei..o 

Fig 43F 



Definition 

def Cro$sbarlnplace(op ( size,rd f rc,rb) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
shifts- band (size-1) 
for i 0 to 1 28-size by size 
case op of 
X.SHR.M: 

ai+size-1.J «- Ci+shift-1..i II dj+ S ize-1..i+shift 
X.SHLM: 

&i+she-1J *- d i+size-1-shifU II Cj+ S hitt-1..i 

endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 



Fig 43G 



Op ration codes 



X.COMPRESS.1.2 


Crossbar compress immediate signed pecks 


X.COMPRESS.1.4 


Crossbar compress immediate signed nibbles 


X.COMPRESS.1.8 


Crossbar compress immediate signed bytes 


X.COMPRESS.1.16 


Crossbar compress immediate signed doublets 


X.COMPRESS.I.32 


Crossbar compress immediate signed quadlets 


X.COMPRESS.I.64 


Crossbar compress immediate signed octlets 


X.COMPRESS.1.128 


Crossbar compress immediate signed hexlet 


X.COMPRESS.I.U.2 


Crossbar compress immediate unsigned pecks 


X.COMPRESS.I.U.4 


Crossbar compress immediate unsigned nibbles 


X.COMPRESS.I.U.8 


Crossbar compress immediate unsigned bytes 


X.COMPRESS.I.U.16 


Crossbar compress immediate unsigned doublets 


X.COMPRESS.I.U.32 


Crossbar compress immediate unsigned quadlets 


X.COMPRESS.I.U.64 


Crossbar compress immediate unsigned octlets 


X.COMPRESS.I.U.128 


Crossbar compress immediate unsigned hexlet 


X.EXPAND.I.2 


Crossbar expand immediate signed pecks 


X.EXPAND.I.4 


Crossbar expand immediate signed nibbles 


X.EXPAND.I.8 


Crossbar expand immediate signed bytes 


X.EXPAND.1.16 


Crossbar expand immediate signed doublets 


X.EXPAND.I.32 


Crossbar expand immediate signed quadlets 


X.EXPAND.I.64 


Crossbar expand immediate signed octlets 


X.EXPAND.1.128 


Crossbar expand immediate signed hexlet 


X.EXPAND.I.U.2 


Crossbar expand immediate unsigned pecks 


X.EXPAND.I.U.4 


Crossbar expand immediate unsigned nibbles 


X.EXPAND.I.U.8 


Crossbar expand immediate unsigned bytes 


X.EXPAND.I.U.16 


Crossbar expand immediate unsigned doublets 


X.EXPAND.I.U.32 


Crossbar expand immediate unsigned quadlets 


X.EXPAND.I.U.64 


Crossbar expand immediate unsigned octlets 


X.EXPAND.I.U.128 


Crossbar expand immediate unsigned hexlet 


X.ROTL.I.2 


Crossbar rotate left immediate pecks 


X.ROTL.I.4 


Crossbar rotate left immediate nibbles 


X.ROTL.1.8 


Crossbar rotate left immediate bytes 


X.ROTLI.16 


Crossbar rotate left immediate doublets 


X.ROTL.I.32 


Crossbar rotate left immediate quadlets 


X.ROTL.I.64 


Crossbar rotate left immediate octlets 


X.ROTL.1.128 


Crossbar rotate left immediate hexlet 


X.ROTR.I.2 


Crossbar rotate right immediate pecks 


X.ROTR.I.4 


Crossbar rotate right immediate nibbles 


X.ROTR.I.8 


Crossbar rotate right immediate by ies 


X.ROTR.1.16 


Crossbar rotate right immediate doublets 


X.ROTR.I.32 


Crossbar rotate right immediate quadlets 


X.ROTR.I.64 


Crossbar rotate right immediate octlets 


|X.ROTR.I.128 


Crossbar rotate right immediate hexlet 



Fig. 43H 



XSHLI2 


Crossbar shift left immediate pecks 


X.SHLI 2 0 


Crossbar shift left immediate signed pecks check overflow \ 


X.SHLI.4 


Crossbar shift left immediate nibbles 


X.SHLI.4.0 


Crossbar shift left immediate signed nibbles check overflow 


X.SHLI.8 


Crossbar shift left immediate bytes 


X.SHLI.8.0 


Crossbar shift left immediate signed bytes check overflow 


X.SHLI.16 


Crossbar shift left immediate doublets 


X.SHLI. 16.0 


Crossbar shift left immediate signed doublets check overflow 


X.SHLI.32 


Crossbar shift left immediate quadlets 


X SHL I 32 0 


Crossbar shift left immediate signed quadlets check overflow 


X SHL 1 64 


Crossbar shift left immediate octlets 


X SHL 1 64 0 


Crossbar shift left immediate signed octlets check overflow 


X SHL 1 128 


Crossbar shift left immediate hexlet 


X SHL 1 128 O 


Crossbar shift left immediate sianed hexlet check ovprflow 


X SHL 1 U 2 O 


Crossbar shift left immediate unsigned pecks check overflow 


X SHL 1 U 4 O 


Crossbar shift left immediate unsianed nibbles ehpck nvprfinw 

■ ********** mm* vi * » i *mw9 » i ■ ■ ii • i w v i w *w Wl lwl\Jl lv\J 1 MvUlww vl IWvi\ \^ V V^l 1 W 


X SHL 1 U 8 O 


Crossbar shift left immediate unsigned bytes check overflow 


X SHL I U 16 O 


Crossbar shift left immediate unsigned doublets check overflow 


X SHL 1 U 32 O 


Crossbar shift left immediate unsianed auadlets check ovprflnw 

w *****m***w *#iiii» v*mW9 % ii w 99 9 IV \*9 %m lv vMvlgilvy VJWW^JIWlw VI 1 WvV\ vf vl MvrV 


X SHL 1 U 64 O 


Crossbar shift left immediate unsigned octlets check overflow 


X SHL 1 U 128 O 


Crossbar shift left immediate unsigned hexlet check overflow 


X SHR 1 2 


Crossbar signed shift right immediate pecks 


X SHR 1 4 


Crossbar signed shift right immediate nibbles 


X.SHR 1 8 


Crossbar signed shift right immediate bytes 


X SHR 1 16 


Crossbar signed shift right immediate doublets 


X SHR 1 32 


Crossbar signed shift right immediate quadlets 


X SHR 1 64 


Crossbar signed shift right immediate octlets 


X.SHR 1 128 


Crossbar signed shift right immediate hexlet 


X.SHR 1 U 2 


Crossbar shift right immediate unsigned pecks 


X.SHR.I.U.4 


Crossbar shift right immediate unsigned nibbles 


X.SHR.I.U.8 


Crossbar shift right immediate unsigned bytes 


X.SHR.I.U.16 


Crossbar shift right immediate unsigned doublets 


X.SHR.I.U.32 


Crossbar shift right immediate unsigned quadlets 


X.SHR.I.U.64 


Crossbar shift right immediate unsigned octlets 


X.SHR.I.U.128 


Crossbar shift right immediate unsigned hexlet 



Fig. 43H (cont) 



Selection 



class 


op 


size 


precision 

- 


COMPRESS.I 

COMPRESS.I.U EXPAND.I 

CYDAMn 1 1 1 


2 4 8 16 32 64 128 


shift 


ROTL.I ROTR.I 
SHLI SHLI.O 
SHL.I.U.O 
SHR.I SHR.I.U 


2 4 8 16 32 64 128 


copy 


COPY 





Format 



X.op.size rd=rc,shift 
rd=xopsize(rc,shift) 

31 24 23 18 17 12 11 6 5 0 

I XSHIFTI | rd | rc | simm | op | 

8 6 6 6 6 

t 256-2*size+shift 
opi..o<-t 7 .. 6 
simm <- ts..o 



Fig. 43! 



Definition 

def CrossbarShortlmmediate(op,rd,rc,simm) 
case (opi..o II simm) of 



0 127* 






QI7A 




128 


12ft 1Q1' 








4 


64 


1Q9 901* 






size 


«— 




224..239: 






size 


<r- 


16 


240..247: 






size 


4- 


8 


248..251: 






size 


«— 


4 


252..2S3: 






size 


<- 


2 


254..25S: 







raise Reservedlnstruction 

endcase 

shift <- (opo || simm) and (size-1) 
c 4- RegRead(rc, 128) 
case (op5..2 II 0 2 ) of 
X.COMPRESS.I: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

aj+hsize-1.J *- Ci+i+shift+hsize-1..i+i+shift 

else 

aj+hsize-1..i «- tfP&aW? II Ci+j+size-1..i+i+shift 

endif 
endfor 
ai27..64<-0 
X.COMPRESS.I.U: 
hsize <- size/2 

for i <r- 0 to 64-hsize by hsize 
if shift £ hsize then 

ai+hsize-1.J «- Q+i+shffi+hsize-1..i+i+shift 

else 

ai+hsize-1..i «- 0 sm ' hslze || q + j+size-1.J+i+shift 

endif 
endfor 
3127..64 «- 0 



Fig. 43J 



X.EXPAND.I: 

hsize <- size/2 

for i «- 0 to 64-hsize by hsize 
if shift £ hsize then 

aw +S ize-1..W «- cftftBlf || Cj+hsize-l..i H 0$hift 

else 

aw+size-1..i+i «- c i+size-shifl-1.J II ° shift 

end if 
endfor 
X.EXPAND.I.U: 
hsize 4- size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

aw +S ize-1..W «- 0»W»*M* || c^fe^ j || 0$™ 

else 

aw+ S ize-l..W «- q+size-shift-I.J II 

endif 
endfor 
X.SHLI: 

for i 0 to 128-size by size 

aj+size-1..i *- Cj +S ize-1-shifLill 0 shlft 
endfor 
X.SHLI.O: 

for i <~ 0 to 128-size by size 

if Cj +S j2e-1..i+size-1-shift * ^sleJl-shifl 
raise FixedPointArithmetic 

endif 

ai+size-1..i <~ Cj+size-1-shifull 0 shfft 
endfor 
X.SHLI.U.O: 

for i <- 0 to 128-size by size 

if Ci+size-1. J+size-shift * 0 shift then 
raise FixedPointArithmetic 

endif 

ai+stze-1..i «- Cj +s ize-1-shifull 0^ 
endfor 

Fig. 43J (cont) 



X.ROTR.I: 

for i <- 0 to 128-size by size 

ai+size-1..i «- Cj+ S hift-1 " c i+size-1..i+shift 
ndfor 
X.SHR.I: 

for i <- 0 to 128-size by size 

aj+size-1 J *- <f+slze-1 II Cj+size-1 ..i+shift 
endfor 
X.SHR.I.U: 

for i <- 0 to 128-size by size 

aj+size-U «- 0 shlft || c j+si2e _ 1 i+shlft 
endfor 

endcase 

RegWrite(rd, 128,a) 
enddef 



Exceptions 



Fixed-point arithmetic 
Reserved Instruction 



Fig. 43J (cont) 



Operation codes 



X.SHLM.1.2 


Crossbar shift left merge immediate pecks 


vy f% III & a ■ a 

X.SHL.M.1.4 


Crossbar shift left merge immediate nibbles 


X.SHL.M.1.8 


ft ft ft »ft • • ft » a ft . 

Crossbar shift left merge immediate bytes 


V/ III ft A 1 A. 

X.SHLM.L16 


Crossbar shift left merge immediate doublets 


X.SHL.M.1.32 


Crossbar shift left merge immediate quadlets 


ai li a a i a 

X.SHLM.1.64 


a*™% ■ 1 * ft 1 «T« » ft • 1 • B • 

Crossbar shift left merge immediate octlets 


X.SHL.M.1.128 


Crossbar shift left merge immediate hexlet 


X.SHR.M.I.2 


Crossbar shift right merge immediate pecks 


V CUD M 1 A 

A.onK.M.1.4 


urossuar snirt ngnt merge immediate nibbles 


X.SHR.M.1.8 


Crossbar shift right merge immediate bytes 


X.SHR.M.1.16 


Crossbar shift right merge immediate doublets 


X.SHR.M.I.32 


Crossbar shift right merge immediate quadlets 


X.SHR.M.I.64 


Crossbar shift right merge immediate octlets 


X.SHR.M.1.128 


Crossbar shift right merge immediate hexlet 



Fig 43K 



Format 



X.op.size rd@rc,shift 
rd=xopsize(rc,shift) 

31 24 23 18 17 12 11 6 5 0 

I XSHIFTI | rd | rc | simm I op | 

8 6 6 6 6 

t <- 256-2*size+shift 

OP1..0 <~ t7..6 

simm <- t5..o 



Fig 43 L 



Definition 

def CrossbarShortlmmediatelnplace(op,rd,rc f simm) 
case (opi..o II simm) of 



0..127: 




siz 


<- 128 


128..191: 




size 


<- 64 


192..223: 




size 


<-32 


224..239: 




size 


<- 16 


240..247: 




size 


f-8 


248..251: 




size 


<-4 


252..253: 




size 


<-2 


254..255: 





raise Reservedlnstruction 

endcase 

shift <- (opo || simm) and (size-1) 
c <- RegRead(rc, 128) 
d <- RegRead(rd, 128) 
for i <- 0 to 128-size by size 
case (op5..2 II 0 2 ) of 
X.SHR.M.I: 

ai+size-1..i <~ q+$hift-1..i II dj+ S ize-1..i+shift 
X.SHLMJ: 

a i+size-1.J «- di+size-1-shifU II Ci+shitt-1..i 

endcase 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved Instruction 



Fig 43M 



Format 

X. EXTRACT ra=rd,rc,rb 
ra=xextract(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 

OP I rd | rc | rb | ra 

8 6 6 6 6 

Fig. 44A 



Definition 



def CrossbarExtract(op,ra,rb,rc,rd) as 
d 4- RegRead(rd, 128) 
c 4- RegRead(rc. 128) 
b4-RegRead(rb.128) 
cas be..oof 



0..255: 




gsize 


4- 128 


256-383: 




gsize 


4-64 


384..447: 




gsize 


4-32 


448..479: 




gsize 


4-16 


480..495: 




gsize 


4-8 


496..503: 




gsize 


4-4 


504..507: 




gsize 


4-2 


508..511: 




gsize 


4-1 



endcase 
m4-bi2 

as 4- signed 4- bi.4 
h 4- (2-m)*gsize 

spos 4- (be..o) and ((2-m)*gsize-1) 
dpos 4- (0 1| b23..i6) and (gsiz*-1) 
sfsize 4- (0 1| b3i.,24) an< * (gsize-1) 

tfsize 4- (sfsize = 0) or ((sfeize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize 4- (tfsize ♦ spos > h) ? h - spos : tfsize 
f or i 4- 0 to 1 28-gsize by gsize 
case op of 

X. EXTRACT: 
if m then 

P *- dgsize+MJ 

else 

p4-(d I|c)2'(gsize*iKI..2*i 

endif 

endcase 

v4-(as&p h .i)||p 

w 4- (as & Vspos+feize-iP^^P 03 1| v feize .i +S pos..spos II 0 dpos 
if m then 

3size-1+i..i «" c gsize-l+i..dpos*fsize+l II w dpos+fcize-1..dpos II Qdpos-1+1J 

else 

a stze-1+U«-* 

endif 

endfor 

RegWrite(ra. 128, a) 
enddef 



Exceptions 

none 



Fig. 44B 



■+ — foizo > < dpoa 
Crossbar extract 

Fig. 44C 



< — fs i zo — x spoo 




rd 



< — fsiz e — > « dpoa 
Crossbar merge extract 



Fig. 44D 



Operation codes 



E.MUL.X 


Ensemble multiply extract 


E. EXTRACT 


Ensemble extract 


E.SCAL.ADD.X 


Ensemble scale add extract 



Fig. 44E 



Format 



E.op ra=rd,rc,rb 



ra=eop(rd,rc,rb) 

31 24 23 18 17 12 11 , 6 5 

I QP I rd | re | rb | ra 

8 6 6 6 6 



Fig. 44F 



def muKsize.h.vs.v.Kws.wj) as 

mul <- ((vs&v S i 2e .ni) h " siz || v si2 e.i + j..i) # ((ws&w size -i + j) h - sl2e || w si2e _ 1+j . j) 
enddef 

def EnsembleExtractfop.ra.rb.rc.rd) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case b8..o of 
0..255: 

sgsize <- 128 
2S6..383: 

sgsize <- 64 
384..447: 

sgsize <- 32 
448..479: 

sgsize <- 16 
480..495: 

sgsize <- 8 
496..503: 

sgsize <- 4 
504..507: 

sgsize <- 2 
508..511: 

sgsize <- 1 

endcase 

m <- bi2 
* n «- bi3 
signed <- b-|4 
case op of 

E.EXTRACT: 

gsize <- sgsize 
h <- (2-m) # gsize 
as signed 

spos <- (b8..o) and ((2-m)*gsize-1) 
E.SCAL.ADD.X: 

if (sgsize < 8) then 

gsize <- 8 
elseif (sgsize*(n+1) > 32) then 

gsize <-32/(n+1) 

else 

gsize <- sgsize 

endif 

ds <- cs <- signed 

bs «- signed A m 

as <- signed or m or n 

h <- (2*gsize) ♦ 1 + n 

spos (b8..o) and (2*gsize-1) 

Fig. 44G 



E.MULX: 

if(sgsiz < 8) th n 

gsize <- 8 
elseif (sgsize*(n+1 ) > 1 28) then 

gsize <- 128/(n+1) 

else 

gsize <- sgsize 

endif 

ds 4- signed 

os <- signed A m 

as <- signed or m or n 

h <- (2*gsize) + n 

spos <- (b8..o) and (2*gsize-1) 

endcase 

dpos <- (0 || b23..i6) and (gsize-1) 
r <- spos 

sfsize <- (0 || b3i..24) and (gsize-1) 

tfsize <- (sfsize = 0) or ((sfsize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize <- (tfsize + spos > h) ? h - spos : tfsize 
if ( b l0..9 ~ z ) and not as then 
rnd <- F 

else 

rnd<-bio..9 

endif 

for i <- 0 to 128-gsize by gsize 
case op of 

E.EXTRACT: 
if m then 

P<-dgsize+M..i 

else 

p^(d||c)2*(gslze+iH.2*l 

endif 
E.MULX: 
if n then 

if (i and gsize) = 0 then 

p <- muKgsize.h.ds.dJ.cs.c.i) - mul(gsize f h t ds f d t i+size,cs,c,i+size) 

else 

p <- muKgsize^h.ds.d.i.cs.cj+size) + muKgsize.h.ds.d.i.cs.c.i+size) 

endif 

else 

p <- muKgsize.h.ds.dJ.cs.cJ) 

endif 

Fig. 44G (cont) 



E.SCAL.ADD.X: 
if n then 

ifflandgsiz ) = Othen 

p «- mul(gsize f h,ds,d j,bs,b,64+2*gsize) 
+ mul(gsize f h ( cs,c t i t bs f b ( 64) 
-muKgsize.h.ds.d.i+gsize.bs.b.W+S'gsize) 
- muKgsizeXcs.c.i+gsize.bs.b.W+gsize) 

else 

p <- mul(gsize f h,ds,d,i,bs,b,64+3*gsize) 
+ mul(gsize,h,cs,c ,i,bs,b,64+gsize) 
+ mul(gsize f h,ds,dj+gsize,bs,b t 64+2 # gsize) 
+ mul(gsize,h,cs i c f i+gsize i bs,b ( 64) 

end if 

else 

p <- mul(gsize t h f ds ( d,i.bs,b,64+gsize) + muKgsize.h.cs.ci.bs.b.M) 

endif 

endcase 
case rnd of 
N: 

s^O^II-PrllP?- 1 

Z: 
F: 

s<~0 h 

C: 

5 4-0^ || 1 r 

endcase 

v^((as& Ptv1 )||p) + (0||s) 

if (Vh..r+fsize = (as & ^fstz^)^ 1 ^ 110 ) or not ( | and (op = e.EXTRACT)) then 
w ^ (as & v r+fsize . 1 )gsize-fsize^pos || vfefee-1+r.r II 0 d P° s 

else 

W4-(s? (Vh || -vg size ^P° s - 1 ) : igsize-dpos) |j O dpos 

endif 

if m and (op = E.EXTRACT) then 

a size-1+Li Cgsize-l+Ldpos+fsize+i II w dpos+fsize-1..dpos II Cdpos-1+1 i 

else 

asize-1+U^w 

endif 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 



Fig. 44G (cont) 



X.DEP0SIT.2 


Crossbar deposit signed pecks 


X.DEP0SIT.4 


Crossbar deposit signed nibbles 


X.DEP0SIT.8 


Crossbar deposit signed bytes 


X.DEP0SIT.16 


Crossbar deposit signed doublets 


X.DEPOSIT.32 


Crossbar deposit signed quadlets 


X.DEPOSIT.64 


Crossbar deposit signed octlets 


X.DEPOSIT.128 


Crossbar deposit signed hexlet 


X.DEP0SIT.U.2 


Crossbar deposit unsigned pecks 


X.DEP0SIT.U.4 


Crossbar deposit unsigned nibbles 


X.DEP0SIT.U.8 


Crossbar deposit unsigned bytes 


X.DEP0SIT.U.16 


Crossbar deposit unsigned doublets I 


X.DEPOSIT.U.32 


Crossbar deposit unsigned quadlets 


X.DEPOSIT.U.64 


Crossbar deposit unsigned octlets 


X.DEPOSIT.U.128 


Crossbar deposit unsigned hexlet 


X. WITH DRAW. U.2 


Crossbar withdraw unsigned pecks 


X. WITH DRAW. U.4 


Crossbar withdraw unsigned nibbtes 


X.WITHDRAW.U.8 


Crossbar withdraw unsigned bytes 


X.WITHDRAW.U.16 


Crossbar withdraw unsigned doublets 


X. WITH DRAW. U.32 


Crossbar withdraw unsigned quadlets 


X.WITHDRAW.U.64 


Crossbar withdraw unsigned octlets 


X.WITHDRAW.U.128 


Crossbar withdraw unsigned hexlet 


X.WITHDRAW.2 


Crossbar withdraw pecks f 


X.WITHDRAW.4 


Crossbar withdraw nibbles 


X.WITHDRAW.8 


Crossbar withdraw bytes 


X.WITHDRAW.16 


Crossbar withdraw doublets 


X.WJTHDRAW.32 


Crossbar withdraw quadlets 


X.WITHDRAW.64 


Crossbar withdraw octlets 


X.WITH DRAW. 128 


Crossbar withdraw hexlet 



Fig. 45A 



Equivalencies 



X. SEX. 1.2 


Crossbar extend immediate signed pecks 


X.SEX.1.4 


Crossbar extend immediate signed nibbles 


X.SEX.1.8 


Crossbar extend immediate signed bytes 


XSEX.1.16 


Crossbar extend immediate signed doublets 


X.SEX.1.32 


Crossbar extend immediate signed quadlets 


XSEXI.64 


Crossbar extend immediate signed octlets 


X.SEX.1.128 


Crossbar extend immediate signed hexlet 


X.ZEX.1.2 


Crossbar extend immediate unsigned pecks 


X.ZEX.1.4 


Crossbar extend immediate unsigned nibbles 


X.ZEXI.8 


Crossbar extend immediate unsigned bytes 


X.ZEX.1.16 


Crossbar extend immediate unsigned doublets 


X.ZEX.1.32 


Crossbar extend immediate unsigned quadlets 


X.ZEX.1.64 


Crossbar extend immediate unsigned octlets 


X.ZEX.1.128 


Crossbar extend immediate unsigned hexlet 



X.SHLI.gsize rd=rc,i 


-> 


X.DEPOSIT.gsize rd=rc,size-i,i 


X.SHR.I.gsize rd=rc,i 


-> 


X.WITHDRAW.gsize rd=rc,size-i,i 


X.SHRU.I.gsize rd-rc,i 


-> 


XWITHDRAW.U.gsize rd=rc,size-i,i 


X.SEX.I.gsize rd-rc,i 


-> 


XDEPOSIT.gsize rd=rc,i,0 


X.ZEX.I.gsize rd=rc,i 


-> 


XDEPOSIT.U.gsize rd=rc,i,0 


Redundancies 


X.DEPOSIT.gsize rd-rc,gsize,0 


o 


XCOPY rd=rc 


X.DEPOSIT.U.gsize rd=rc,gsize,0 


<=> 


X.COPY rd=rc 


X.WITHDRAW.gsize rd=rc,gsize,0 


<=> 


X.COPY rd=rc 


X.WITHDRAW.U.gsize rd=rc,gsize,0 


<=> 


XCOPY rd=rc 



Fig. 45A (cont'd) 



Format 



X.op.gsize rd=rc,isize,ishift 
rd=xopgsize(rc,isize,ishift) 

31 26252423 18 17 1211 65 0 

I op I ih I rd | rc | gsfp j gsfs | 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs <- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 

Fig. 45B 



Definition 

def CrossbarField(op,rd,rc,gsfp,gsfs) as 
c <- RegRead(rc, 128) 
case ((opi || gsfp) and (opo || gsfs)) of 
0..63: 

gsize 128 
64..9S: 

gsize <- 64 
96..111: 

gsize <- 32 
112..119: 

gsize <- 16 
120..123: 

gsize <- 8 
124..125: 

gsize <- 4 

126: 

gsize <- 2 

127: 

raise Reserved Instruction 

endcase 

ishift <- (opi || gsfp) and (gsize-1) 
isize <- ((opo || gsfs) and (gsize-1))+1 
if (ishift+isize>gsize) 

raise Reserved Instruction 

end if 

case op of 

X.DEPOSIT: 

for i 4- 0 to 128-gsize by gsize 

q+gste-U <- c^fe^e-ishift „ cwsfce-1..i II O^hift 
endfor 
X.DEPOSIT.U: 

for i <- 0 to 128-gsize by gsize 

ai+gsize-U <- 09size-isize-ishift || c l+is i ze -i..i || V* m 
endfor 
X.WITHDRAW: 

for i <- 0 to 128-gsize by gsize 

aj+gsize-1..i «- cf+^l+iihift-l II Q+isize+ishifM.j+ishift 
endfor 
X.WITHDRAW.U: 

for i <- 0 to 1 28-gsize by gsize 

aj+gsize-1..i <- 09size-isize || q+bize+tahift-l ..Wshrft 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved instruction 

Fig. 45C 



127 



ih,| |gsfp 



ih 0 | | gsfs 



127 



encoding for crossbar field 



Fig. 45D 




crossbar deposit 
Fig. 45E 



< — fstze — ► 
crossbar withdraw 



Fig. 45F 



Op ration codes 



X DEPOSIT M 2 


f^rn^^h^r ripnnQit mprnp nppkQ 


X.DEP0SIT.M.4 


Crossbar deposit merge nibbles 


X.DEP0SIT.M.8 


Crossbar deposit merge bytes 


X.DEP0SIT.M.16 


Crossbar deposit merge doublets 


X.DEPOSIT.M.32 


Crossbar deposit merge quadlets 


X.DEPOSIT.M.64 


Crossbar deposit merge octlets 


X.DEPOSIT.M.128 


Crossbar deposit merge hexlet 



Fig 45G 



Format 



X.op.gsize rd@rc,isize,ishift 
rd=xopgsize(rd,rc,isize,ishift) 

31 26252423 1817 1211 65 0 

I op I ih | rd | rc | gsfp | gsfs | 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs <- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 



Fig 45H 



Definition 

def CrossbarFieldlnplace(op,rd,rc t gsfp t gsfs) as 
c <- RegRead(rc, 128) 
d <- RegRead(rd, 128) 
case ((op-| || gsfp) and (opo || gsfs)) of 
0..63: 

gsize <- 128 
64..9S: 

gsize <- 64 
96..111: 

gsize <- 32 
112..119: 

gsize ^- 16 
120.. 123: 

gsize 8 
124..125: 

gsize <- 4 

126: 

gsize <- 2 

127: 

raise Reserved Instruction 

endcase 

ishift <- (opi || gsfp) and (gsize-1) 
isize <- ((opo || gsfs) and (gsize-1 ))+1 
if (ishift+isize>gsize) 

raise Reservedlnstruction 

endif 

for i <- 0 to 128-gsize by gsize 

ai+gsize-1J <- di+gsize-1..i+isize+ishift I! Cj+isize-1..» II d|+ishift-1..i 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved instruction 

Fig 451 



< — fsizo — ► 




< — fsiz e — >< dpos 
crossbar deposit merge 



Fig 45J 



X.SHUFFLE.4 


Crossbar shuffle within pecks 


X.SHUFFLE.8 


Crossbar shuffle within bytes 


X.SnUrrLc.16 


Crossbar shuffle within doublets 


X.SHUFFLE.32 


Crossbar shuffle within quadlets 1 


X.SHUFFLE.64 


Crossbar shuffle within octlets 


X.SHUFFLE.128 


Crossbar shuffle within hexlet 


X.SHUFFLE.256 


Crossbar shuffle within triclet 



Fig.46A 



Format 



X.SHUFFLE.256 rd=rc,rb,v,w,h 
X.SHUFFLE.size rd=rcb,v,w 

rd=xshuffle256(rc,rb,v,w,h) 
rd=xshufflesize(rcb,v,w) 

31 24 23 18 17 12 11 6 5 0 

j xlSHUFFLE | rd | rc I rb | op | 

8 6 6 6 6 

rc <- rb <- rcb 
x<-log2(size) 
y<-log2(v) 
Z4-log2(w) 

op «- ((x*x*x-3*x*x-4*x)/6-(z*z-z)/2+x*z+y) + (size=256)*(h*32-56) 



Fig. 46B 



Definition 



def CrossbarShufflefmajor.rd.rc.rb.op) 
c«- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
if rc=rb then 
case op of 
0..55: 

for x <- 2 to 7; for y 4- 0 to x-2; for z <- 1 to x-y-1 

if op = ((x*x*x-3Vx-4*x)/6-(z*z-z)/2+x*z+y) then 
fori<-0to127 

a i ^ c 06.jc II iy*z-1..y II ix.1..y>z II iy-1..0) 

end 

end if 

endfor; endfor; endfor 
56..63: 

raise Reservedinstruction 

endcase 

elseif 

case op4„o of 
0..27: 

cb «- c || b 
x «- 8 
h <- ops 

for y <- 0 to x-2; for z <- 1 to x-y-1 
if op 4 ..o = ((1 7*z-z*z)/2-8+y) then 
fori«-h # 128to127+h*128 

aj.h-128 «- CbOy^.L.y || ix-1..y+z || iy.L.0) 

end 

end if 
endfor; endfor 
28..31: 

raise Reservedinstruction 

endcase 

endif 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Reserved Instruction 



Fig.46C 



127 rcb(128) o 




127 



rd(128) o 



4-way shuffle bytes within hexlet 



Fig. 46D 




12? rd(128) o 



4-way shuffle bytes within triclet 
Fig. 46E 



Format 



X.SWIZZLE rd=rc,icopy,iswap 
rd=xswizzle(rc,icopy f iswap) 

31 26 2524 23 1817 12 11 6 5 0 

| X.SWIZZLE | ih | rd | rc | icopya \ iswapa H 

6 2 6 6 6 6 

icopya <- icopy 5 .. 0 
iswapa <- iswap5..o 
ih <- icopye 1 1 iswap6 

Fig.47A 



Definition 

def GroupSwizzIelmmediatefih.rd.rcjcopyajswapa) as 
icopy <- ihj || icopya 

iswap 4- i ho || iswapa 
c <- RegRead(rc, 128) 
fori<-0to127 

ai «- C(| & jcopy) a i SW ap 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 



Fig. 47B 




16-bit reverse 



Fig. 47C 



IX.SELECT.8 



Crossbar select bytes 



Format 



op ra=rd,rc,rb 



ra=op(rd,rc,rb) 

31 24 23 18 17 12 11 65 

I op I rd | rc | rb | "ra" 

8 6 6 6 6 

Fig. 47D 



Definition 

def CrossbarTernary(op,rd,rc,rb t ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
dc «- d || c 
fori<-0to15 
j <- bs*i+4..8 # i 

a8 # i+7..8*i <- dC8*j+7..8*j 
endfor 

RegWrite(ra f 128, a) 
enddef 

Exceptions 

none 

Fig. 47E 



Pin summary 



A20M# 


I 


Addr ss bit 20 Mask is an emulator signal. 


A31..A3 


IO 


Addr ss, in combination with byte enabl , indicate the 
physical addresses of memory or device that is the target 
of a bus transaction. This signal is an output, when the 
processor is initiating the bus transaction, and an input 
when the processor is receiving an inquire transaction or 
snooping another processor's bus transaction. 


ADS# 


IO 


ADdress Strobe, when asserted, indicates new bus 
transaction by the processor, with valid address and byte 
enable simultaneously driven. 


ADSC# 


0 


Address Strobe Copy is driven identically to address 
strobe 


AHOLD 


I 


Address HOLD, when asserted, causes the processor to 
cease driving address and address parity in the next bus 
clock cycle. 


AP 


IO 


Address Parity contains even parity on the same cycle as 
address. Address parity is generated by the processor 
when address is an output, and is checked when address 
is an input. A parity error causes a bus error machine 
check. 


APCHK# 


0 


Address Parity CHecK is asserted two bus clocks after 
EADS# if address parity is not even parity of address. 


APICEN 


I 


Advanced Programmable Interrupt Controller ENable 

is not implemented. 


BE7#..BE0# 


IO 


Byte Enable indicates which bytes are the subject of a 
read or write transaction and are driven on the same cycle 
as address. 


BF1..BF0 


I 


Bus Frequency is sampled to permit software to select 
the ratio of the processor clock to the bus clock. 


BOFF# 


I 


BackOFF is sampled on the rising edge of each bus clock, 
and when asserted, the processor floats bus signals on the 
next bus clock and aborts the current bus cycle, until the 
backoff signal is sampled negated. 


BP3..BP0 


0 


Breakpoint is an emulator signal. 


BRDY# 


I 


Bus ReaDY indicates that valid data is present on data on 
a read transaction, or that data has been accepted on a 
write transaction. 


BRDYC# 


I 


Bus ReaDY Copy is identical to BRDY#; asserting either 
signal has the same effect. 


BREQ 


0 


Bus REQuest indicates a processor initiated bus request. 



Fig. 48 



BUSCHK# 


1 


BUS CHecK is sampled on the rising edge of the bus 
clock, and when asserted, causes a bus error machine 
check. 


CACHE# 


0 


CACHE, when asserted, indicates a cacheable read 
transaction or a burst write transaction. 


CLK 


1 


bus CLocK provides the bus clock timing edge and the 
frequency reference for the processor clock. 


CPUTYP 


1 


CPU TYPe, if low indicates the primary processor, if high, 
the dual processor. 


D/C# 


1 


Data/Code is driven with the address signal to indicate 
data, code, or special cycles. 


D63..D0 


10 


Data communicates 64 bits of data per bus clock. 


D/P# 


0 


Dual/Primary is driven (asserted, low) with address on 
the primary processor 


DP7..DP0 


10 


Data Parity contains even parity on the same cycle as 
data. A parity error causes a bus error machine check. 


DPEN# 


10 


Dual Processing Enable is asserted (driven low) by a 
Dual processor at reset and sampled by a Primary 
processor at the falling edge of reset. 


EADS# 


1 


External Address Strobe indicates that an external 
device has driven address for an inquire cycle. 


EWBE# 


1 


External Write Buffer Empty indicates that the external 
system has no pending write. 


FERR# 


0 


Floating point ERRor is an emulator signal. 


FLUSH# 


1 


cache FLUSH is an emulator signal. 


FRCMC# 


1 


Functional Redundancy Checking Master/Checker is 

not implemented. 


HIT# 


10 


HIT indicates that an inquire cycle or cache snoop hits a 
valid line. 


HITM# 


10 


HIT to a Modfied line indicates that an inquire cycle or 
cache snoop hits a sub-block in the M cache state. 


HLDA 


0 


bus HoLD Acknowlege is asserted (driven high) to 
acknowlege a bus hold request 


HOLD 


1 


bus HOLD request causes the processor to float most of 
its pins and assert bus hold acknowlege after completing 
all outstanding bus transactions, or during reset. 


IERR# 


0 


Internal ERRor is an emulator signal. 


IGNNE# 


1 


IGNore Numeric Error is an emulator siqnal. 


INIT 


1 


INITialization is an emulator signal. 1 


INTR 


1 


maskable IN TeRrupt is an emulator siqnal. 


INV 


1 


INValidation controls whether to invalidate the addressed 
cache sub-block on an inqure transaction. 



Fig. 48 (c nfd) 



KEN# 


1 


Cache ENable is driven with address to indicate that the 

rpari or write transartion is canhpahlp 


LINT1..LINT0 


1 


Local INT rrupt is not implemented. 




o 


hue LOflVC is rlrix/pn ctzirtinn with arirfrpss anrl pnriinn 

UU9 LV/vi\ IO UMVCI 1 010 1 III IM Willi aUUIC99 Cil IVJ wllvJIIIM 

after bus ready to indicate a locked series of bus 
transactions 


M/IO# 

IVI/ 1 \S7T 


o 


Memorv/lnout Outnut is driven with address to indicate a 
memory or I/O transaction. 


NA# 


1 


Next Address indicates that the external system will 

arppnt an arirlrp<i«i fnr a npw hus rvHp in two hiiQ Hnrks 

OVAsw^sl Oil hUUI«99 IWI CI llwVr UU9 wjfwlw III IWU UUv UlUvlxO > 


NMI 


1 


Non Maskable Interrupt is an emulator signal. 




in 


Driv/ata Due ^raMT ic H ri\/on hotu/oon Drimon/ onH Piiiol 

rnvaie dus orari i is u riven uciwccii r nrnary anu uuai 
processors to indicate that bus arbitration has completed, 

nrantinn ck now m actor arrocc tn tho hi ic 


PBREQ# 


IO 


Private Bus REQuest is driven between Primary and Dual 

nrnrocenre tn rani inct o nouti moctor apfoee tn IK a Ki ic 


PCD 


O 


Page Cache Disable is driven with address to indicate a 
not cacheable transaction. 


PCHK# 


0 


Parity CHecK is asserted (driven low) two bus clocks after 
aaia appears wiin ouu paniy on enauieu oyies. 


PHIT# 


IO 


Private HIT is driven between Primary and Dual 
processors to indicate that the current read or write 
transaction addresses a valid cache sub-block in the slave 

piuoe&our. 


PHITM# 


10 


Private HIT Modified is driven between Primary and Dual 
pr uoeobur 0 iu inuicaie inai ine current reau or write 
transaction addresses a modified cache sub-block in the 


PICCLK 


1 


Programmable Interrupt Controller CLocK is not 

imnlpmontoH 

II 1 IplCI 1 Id IICU. 


PICD1 PICD 

o 


IO 

Iv 


Pmnrsmnmsihlo 1 ntorn int Onnf rnllor Data ic nnt 

imnlpmpntprl 

II 1 IL/lv7l 1 Ivl 1 ICU . 


PEN# 


1 


Parity Enable, if active on the data cycle, allows a parity 

prror tr> causp p hiiQ prror mpphinp phock 

Cllwl IU U1UOC a UUd CI 1 \Jl 1 1 IdVsl III l\7 wl ICrVsiX. 


PM1 PMO 

1 IVI 1 • • 1 IVI V/ 


o 


PprfnrmancA Mnnitorinn is an pmiilatnr cinnal 
ivi iwi iiiauw iviv/i 11 ii#i 11 iij 10 ail diiuiaiui oiyiiai. 


PRDY 

1 1 \ L-/ 1 


o 


Prohp RpaHY is not imnlpmpntprl 

1 1 V/Mw IwQU 1 IO 1 IUl II 1 I)jlv7l 1 Iv7l llwU. 


PWT 


0 


Page Write Through is driven with address to indicate a 
not write allocate transaction. 


R/S# 


1 


Run/StoD is not imDlemented 


RESET 


1 


RESET causes a processor reset. 


SCYC 


o 


Split CYCIe is asserted during bus lock to indicate that 
more than two transactions are in the series of bus 
transactions. 



Fig. 48 (cont'd) 



SMI# 


1 


System Management Interrupt is an emulator signal. 


SMIACT# 


0 


System Manag ment Interrupt ACTive is an emulator 
signal. 


STPCLK# 


1 


ST P CLocK is an emulator signal. 


TCK 


1 


Test CLocK follows IEEE 1 149.1 . 


TDI 


1 


Test Data Input follows IEEE 1149.1. 


TDO 


0 


Test Data Output follows IEEE 1 149.1. 


TMS 


1 


Test Mode Select follows IEEE 1 149.1 . 


TRST# 


1 


Test ReSeT follows IEEE 1 149.1 . 


VCC2 


1 


VCCof2.8V at 25 pins 


VCC3 


1 


VCCof3.3V at 28 pins 


VCC2DET# 


0 


VCC2 DETect sets appropriate VCC2 voltage level. 


VSS 


1 


VSS supplied at 53 pins 


W/R# 


0 


Write/Read is driven with address to indicate write vs. 
read transaction. 


WB/WT# 


1 


Write Back/Write Through is returned to indicate that 
data is permitted to be cached as write back. 



Fig. 48 (cont'd) 



Electrical Specifications 



Clock rate 


66 MHz 


75 MHz 


100 MHz 


133 MHz 




Parameter 


min 


max 


min 


max 


min 


max 


min 


max 


unit 


CLK frequency 


33.3 


66.7 


37.5 


75 


50 


100 




133 


MH 

z 


CLK period 


15.0 


30.0 


13.3 


26.3 


10.0 


20.0 






ns 


CLK high time (^2v) 


4.0 




4.0 




3.0 








ns 


CLK low time (<0.8V) 


4.0 




4.0 




3.0 








ns 


CLK rise time (0.8V->2V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK fall time (2V->0.8V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK period stability 




250 




250 




250 






ps 



Fig. 49A 



A31..3 valid delay 


1.1 


6.3 


1.1 


4.5 


1.1 


4.0 






ns 


A31..3 float delay 




10.0 




7.0 




7.0 






ns ! 


ADS# valid delay 


1.0 


6.0 


1.0 


4.5 


1.0 


4.0 






ns 


ADS# float delay 




10.0 




7.0 




7.0 






ns 


ADSC# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns i 


ADSC# float delay 




10.0 




7.0 




7.0 






ns 


AP valid delay 


1.0 


8.5 


1.0 


5.5 


1.0 


5.5 






ns 


AP float delay 




10.0 




7.0 




7.0 






ns 


APCHK# valid delay 


1.0 


8.3 


1.0 


4.5 


1.0 


4.5 






ns 


BE7..0# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


BE7..0# float delay 




10.0 




7.0 




7.0 






ns 


BP3..0 valid delay 


1.0 


10.0 














ns 


BREQ valid delay 


1.0 


8.0 


1.0 


4.5 


1.0 


4.0 






ns 


CACHE# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


CACHE# float delay 




10.0 




7.0 




7.0 






ns 


D/C# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


D/C# float delay 




10.0 




7.0 




7.0 






ns 


D63..0 write data valid delay 


1.3 


7.5 


1.3 


4.5 


1.3 


4.5 






ns 


D63..0 write data float delay 




10.0 




7.0 




7.0 






ns 


DP7..0 write data valid delay 


1.3 


7.5 


1.3 


4.5 


1.3 


4.5 






ns 


DP7..0 write data float delay 




10.0 




7.0 




7.0 






ns 


FERR# valid delay 


1.0 


8.3 


1.0 


4.5 


1.0 


4.5 






ns 


HIT# valid delay 


1.0 


6.8 


1.0 


4.5 


1.0 


4.0 






ns 


HITM# valid delay 


1.1 


6.0 


1.1 


4.5 


1.1 


4.0 






ns 


HLDA valid delay 


1.0 


6.8 


1.0 


4.5 


1.0 


4.0 






ns 


IERR# valid delay 


1.0 


8.3 














ns 


LOCK# valid delay 


1.1 


7.0 


1.1 


4.5 


1.1 


4.0 






ns 


LOCK# float delay 




10.0 




7.0 




7.0 






ns 


M/IO# valid delay 


1.0 


5.9 


1.0 


4.5 


1.0 


4.0 






ns 


M/IO# float delay 




10.0 




7.0 




7.0 






ns 


PCD valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


PCD float delay 




10.0 




7.0 




7.0 






ns 


PCHK# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.5 






ns 


PM1..0 valid delay 


1.0 


10.0 














ns 


PRDY valid delav 


1.0 


8.0 














ns 


PWT valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


PWT float delay 




10.0 




7.0 




7.0 






ns 


SCYC valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


outo Tioat delay 




10.0 




7.0 




7.0 






ns 


SMIACT# valid delay 


1.0 


7.3 


1.0 


4.5 


1.0 


4.0 






ns 


W/R# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


W/R# float delay 




10.0 




7.0 




7.0 






ns 
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A31..5 setup time 


6.0 




3.0 




3.0 








ns 


A31..5 hold time 


1.0 




1.0 




1.0 








ns 


A20M# setup time 


5.0 




3.0 




3.0 








ns 


A20M# hold time 


1.0 




1.0 




1.0 








ns 


AHOLD setup time 


5.5 




3.5 




3.5 








ns 


AHOLD hold time 


1.0 




1.0 




1.0 








ns 


AP setup time 


5.0 




1.7 




1.7 








ns 


AP hold time 


1.0 




1.0 




1.0 








ns 


BOFF# setup time 


5.5 




3.5 




3.5 








ns 


BOFF# hold time 


1.0 




1.0 




1.0 








ns 


BRDY# setup time 


5.0 




3.0 




3.0 








ns 


BRDY# hold time 


1.0 




1.0 




1.0 








ns 


BRDYC# setup time 


5.0 




3.0 




3.0 








ns 


BRDYC# hold time 


1.0 




1.0 




1.0 








ns 


BUSCHK# setup time 


5.0 




3.0 




3.0 








ns 


BUSCHK# hold time 


1.0 




1.0 




1.0 








ns 


D63..0 read data setup time 


2.8 




1.7 




1.7 








ns 


D63..0 read data hold time 


1.5 




1.5 




1.5 








ns 


DP7..0 read data setup time 


2.8 




1.7 




1.7 








ns 


DP7..0 read data hold time 


1.5 




1.5 




1.5 








ns 


EADS# setup time 


5.0 




3.0 




3.0 








ns 


EADS# hold time 


1.0 




1.0 




1.0 








ns 


EWBE# setup time 


5.0 




1.7 




1.7 








ns 


EWBE# hold time 


1.0 




1.0 




1.0 








ns 


FLUSH# setup time 


5.0 




1.7 




1.7 








ns 


FLUSH# hold time 


1.0 




1.0 




1.0 








ns 


FLUSH# asvnc pulse width 


2 




2 




2 








CLK 


HOLD setup time 


5.0 




1.7 




1.7 








ns 


HOLD hold time 


1.5 




1.5 




1.5 








ns 


IGNNE# setup time 


5.0 




1.7 




1.7 








ns 


IGNNE# hold time 


1.0 




1.0 




1.0 








ns 


IGNNE# asvnc Dulse width 


2 




2 




2 








CLK 


I NIT setup time 


5.0 




1.7 




1.7 








ns 


INIT hold time 


1.0 




1.0 




1.0 








ns 


I NIT asvnc pulse width 


2 




2 




2 








CLK 


INTR setup time 


5.0 




1.7 




1.7 








ns 


INTR hold time 


1.0 




1.0 




1.0 








ns 


INV setup time 


CO 




1.7 




1.7 








ns 


INV hold time 


1.0 




1.0 




1.0 








ns 


KEN# setup time 


5.0 




3.0 




3.0 








ns 


KEN# hold time 


1.0 




1.0 




1.0 








ns 


NA# setup time 


4.5 




1.7 




1.7 








ns 



Fig. 49C 



NA# hold time 


1.0 




A A 

1.0 




A 

1.0 








ns 


NMI setup time 


5.0 




1.7 




1.7 








ns 


KIAJII UaU 

NMI hold time 


1.0 




A f\ 

1.0 




1.0 








ns 


NMI asvnc pulse width 


2 




2 




2 








CLK 


rbNff setup time 


/I o 

4.8 




A T 

1.7 




1.7 








ns 


ntiw noio time 


A ft 
l.U 




1.0 




1.0 








ns 


K/off setup time 


0.0 




1.7 




1.7 








ns 


K/s# hold time 


1.0 




1.0 




1.0 








ns 


R/S# asvnc pulse width 


2 




2 




2 








CLK 


SMl# setup time 


5.0 




1.7 




1.7 








ns 


5Ml# hold time 


A f\ 

1.0 




1.0 




A f\ 

1.0 








ns 


SMI# asvnc nutep width i 


2 




o 




o 
c 










STPCLK# setup time 


5.0 




1.7 




1.7 








ns 


STPCLK# hold time 


1.0 




1.0 




1.0 








ns 


WB/WT# setup time 


4.5 




1.7 




1.7 








ns 


WB/WT# hold time 


1.0 




1.0 




1.0 








ns 
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RESET setup time 


5.0 




1.7 




1.7 








ns 


RESET hold time 


1.0 




1.0 




1.0 








ns 


RESET pulse width 


15 




15 




15 








CLK 


RESET active 


1.0 




1.0 




1.0 








ms 


BF2..0 setup time 


1.0 




1.0 




1.0 








ms 


BF2..0 hold time 


2 




2 




2 








CLK 


BRDYC# hold time 


1.0 




1.0 




1.0 








ns 


BRDYC# setup time 


2 




2 




2 








CLK 


BRDYC# hold time 


2 




2 




2 








CLK 


FLUSH# setup time 


5.0 




1.7 




1.7 








ns 


FLUSH# hold time 


1.0 




1.0 




1.0 








ns 


FLUSH# setup time 


2 




2 




2 










FLUSH# hold time 


2 




2 




2 











Fig. 49D 



PBRFO# fliaht time 


0 


2 0 














nc 
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Operation codes 



L.8 


Load signed byte 


L16.B 


Load signed doublet big-endian 


L.16.A.B 


Load signed doublet aligned big-endian 


L16.L 


Load signed doublet little-endian 


L16.A.L 


Load signed doublet aligned little-endian 


L.32.B 


Load signed quadlet big-endian 


L.32.A.B 


Load signed quadlet aligned big-endian 


L.32.L 


Load signed quadlet little-endian 


L.32.A.L 


Load signed quadlet aligned little-endian 


L.64.B 


Load signed octlet big-endian 


L.64.A.B 


Load signed octlet aligned big-endian j 


L.64.L 


Load signed octlet little-endian 


L.64.A.L 


Load signed octlet aligned little-endian 


L128.B 


Load hexlet big-endian 


L128.A.B 


Load hexlet aligned big-endian 


L128.L 


Load hexlet little-endian I 


L128.A.L 


Load hexlet aligned little-endian 


L.U.8 


Load unsigned byte 


LU.16.B 


Load unsigned doublet big-endian 


LU.16.A.B 


Load unsigned doublet aligned big-endian 


LU.16.L 


Load unsigned doublet little-endian 


LU.16.A.L 


Load unsigned doublet aligned little-endian 


L.U.32.B 


Load unsigned quadlet big-endian 


L.U.32.A.B 


Load unsigned quadlet aligned big-endian 


LU.32.L 


Load unsigned quadlet little-endian | 


L.U.32.A.L 


Load unsigned quadlet aligned little-endian 


L.U.64.B 


Load unsigned octlet big-endian 


L.U.64.A.B 


Load unsigned octlet aligned big-endian 


L.U.64.L 


Load unsigned octlet little-endian 


L.U.64.A.L 


Load unsigned octlet aligned little-endian 



Fig. 50A 



S lection 



number format 


type 


size 


alignment 


ordering 


signed byte 
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unsigned byte 
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signed integer 
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signed integer aligned 
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L B 


unsigned integer 


U 


16 32 64 




L B 


unsigned integer aligned 


U 


16 32 64 


A 


L B 


register 




128 




L B 


register aligned 




128 


A 


L B 



Format 



op rd=rc,rb 
rd=op(rc,rb) 

31 24 23 1817 12 11 6 5 0 

I L.MINOR | rd | rc | rb | op ~| 

8 6 6 6 6 



Fig. 50B 



Definition 

def Load(op,rd,rc,rb) as 
case op of 

L16L, L32L, L8, L16AL. L32AL, L16B, L32B, L16AB, L32AB, 
L64L, L64AL. L64B, L64AB: 
signed <- true 

LU16L. LU32L, LU8, LU16AL, LU32AL, LU16B. LU32B, LU16AB, LU32AB, 
LU64L. LU64AL, LU64B. LU64AB: 

signed <- false 
L128L, L128AL, L128B, L128AB: 

signed <- undefined 

endcase 
case op of 
L8.LU8: 

size «-8 

L16L, LU16L, L16AL, LU16AL, L16B, LU16B, L16AB, LU16AB: 
size <- 16 

L32L, LU32L, L32AL, LU32AL, L32B, LU32B, L32AB. LU32AB: 
size <- 32 

L64L, LU64L, L64AL, LU64AL, L64B, LU64B, L64AB, LU64AB: 

sizs < 64 
L128L, L128AL, L128B, L128AB: 

size<- 128 

endcase 

Isize <- log(size) 

case op of 

L16L, LU16L, L32L, LU32L, L64L, LU64L, L128L. 
L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL: 
order <- L 

L16B, LU16B, L32B, LU32B, L64B, LU64B, L128B, 

L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 

order <- B 
L8, LU8: 

order <- undefined 

endcase 



Fig. 50C 



c «- RegRead(rc, 64) 

b <- RegRead(rt), 64) 

VirtAddr <- c + (b 6 6-lsize..O II 0 lsize - 3 ) 

case op of 

L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL, 
L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 
if (C|size-4..0 ^ 0 then 

raise AccessDisallowedByVirtualAddress 

endif 

L16L, LU16L, L32L, LU32L, L64L, LU64L, L128L, 
L16B, LU16B, L32B, LU32B, L64B, LU64B, L128B: 
L8, LU8: 
endcase 

m <- LoadMemory(c t WtAddr,size,order) 
a «- (™size-1 and signed) 1 28-size || m 
RegWrite(rd, 128, a) 
nddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 50C (cont) 



Operation cod s 



L.1.8 


Load immediate signed byte 


LI.16AB 


Load immediate signed doublet aligned big-endian 


LI.16.B 


Load immediate signed doublet big-endian 


LI.16.A.L 


Load immediate signed doublet aligned little-endian 


L.I.16.L 


Load immediate signed doublet little-endian 


LI.32.A.B 


Load immediate signed quadlet aligned big-endian 


LI.32.B 


Load immediate signed quadlet big-endian 


L.I.32AL 


Load immediate signed quadlet aligned little-endian 


LI.32.L 


Load immediate signed quadlet little-endian 


LI.64.A.B 


Load immediate signed octlet aligned big-endian 


LI.64.B 


Load immediate signed octlet big-endian 


LI.64.A.L 


Load immediate signed octlet aligned little-endian 


L.I.64.L 


Load immediate signed octlet little-endian 


L.I.128.A.B 


Load immediate hexlet aligned big-endian 


LI.128.B 


Load immediate hexlet big-endian 


LI.128AL 


Load immediate hexlet aligned little-endian 


LI.128.L 


Load immediate hexlet little-endian 


L.I.U.8 


Load immediate unsigned byte 


LI.U.16AB 


Load immediate unsigned doublet aligned big-endian 


LI.U.16.B 


Load immediate unsigned doublet big-endian 


LI.U.16AL 


Load immediate unsigned doublet aligned little-endian 


LI.U.16.L 


Load immediate unsigned doublet little-endian 


LI.U.32AB 


Load immediate unsigned quadlet aligned big-endian 


L.I.U.32.B 


Load immediate unsigned quadlet big-endian 


LI.U.32AL 


Load immediate unsigned quadlet aligned little-endian 


LI.U.32.L 


Load immediate unsigned quadlet little-endian 


L.I.U.64AB 


Load immediate unsigned octlet aligned big-endian 


L.I.U.64.B 


Load immediate unsigned octlet big-endian 


L.I.U.64AL 


Load immediate unsigned octlet aligned little-endian 


L.I.U.64.L 


Load immediate unsigned octlet little-endian 



Fig. 51A 



Selection 



number format 


type 


size 


aiignrneni 


oraenng 


signeo Dyie 




o 
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unsigned byte 


U 


8 






signed integer 
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L B 


signed integer aligned 




16 32 64 
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L B 


unsigned integer 


U 


16 32 64 




L B 


unsigned integer aligned 


U 


16 32 64 


A 


L B 


register 




128 




L B 


register aligned 




128 


A 


L B 



Format 



op rd=rc,offset 
rd=op(rc,offset) 

31 24 23 18 17 12 11 0 

f op | rd | rc j offset 

8 6 6 12 



Fig. 51 B 



Definition 



def Loadlmmediate(op,rd,rc,offset) as 
case op of 

LI16L, LI32L. LI8. LI16AL. LI32AL. LI16B, LI32B, LI16AB, LI32AB: 
LI64L. LI64AL, LI64B, LI64AB: 

signed <- true 
LIU16L, LIU32L, LIU8, LIU16AL, LIU32AL, . 
LIU16B, LIU32B, LIU16AB, LIU32AB: 
LIU64L, LIU64AL, LIU64B, LIU54AB: 

signed +- false 
LI128L, LI128AL, LI128B, LI128AB: 

signed «- undefined 

endcase 
case op of 
LI8, LIU8: 
size <- 8 

LI16L, LIU16L, LI16AL, LIU16AL, LI16B, UU16B, LI16AB, LIU16AB: 
size*- 16 

LI32L, LIU32L. LI32AL, LIU32AL, LI32B, LIU32B, LI32AB, LIU32AB: 
size <- 32 

LI64L, LIU64L, LI64AL, LIU64AL, LI64B, LIU84B, LI64AB, LIU64AB: 

LI128L, LI128AL, LI128B, LI128AB: 
size 128 

endcase 

Isize <- log(size) 

case op of 

LI16L, LIU16L, LI32L, LIU32L, LI64L, LIU64L, LI128L, 
LI16AL, LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL: 
order <- LI 

LI16B, LIU16B, LI32B, LIU32B, LI64B, LIU64B, LI128B, 

LI16AB, LIU16AB, LI32AB, LIU32AB, U64AB, LIU64AB, LI128AB: 

order <- B 
LI8, LIU8: 

order <- undefined 

endcase 



Fig. 51 C 



c <- RegRead(rc, 64) 

VirtAddr <- c + (offset^ 1 ** || offset || 0 ,siz *- 3 ) 
case op of 

LI16AL, LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL, 
LI16AB, LIU16AB, LI32AB, LIU32AB, LI64AB, LIU64AB, LI128AB: 

*f (C|size-4..0 * 0 fr en 

raise AccessDisallowedByVirtualAddress 

endif 

LI16L, LIU16L, LI32L, UU32L, LI64L, LIU64L, LI128L, 
LI16B, UU16B, LI32B, LIU32B, LI64B, UU64B, U128B: 
LI8, LIU8: 
endcase 

m <- LoadMemory(c,VirtAddi\size,order) 
a «- (m$tee-1 and signed) 1 28-size || m 
RegWrite(rd, 128, a) 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 51C(cont) 



Operation codes 



S.8 


Store byte 


S.16.B 


Store double big-endian 


S.16.A.B 


Store double aligned big-endian 


S.16.L 


Store double little-endian 


S.16.A.L 


Store double aligned little-endian 


S.32.B 


Store quadlet big-endian 


S.32.A.B 


Store quadlet aligned big-endian 


S.32.L 


Store quadlet little-endian 


S.32.A.L 


Store quadlet aligned little-endian 


S.64.B 


Store octlet big-endian 


S.64.A.B 


Store octlet aligned big-endian 


S.64.L 


Store octlet little-endian 


S.64AL 


Store octlet aligned little-endian 


S.128.B 


Store hexlet big-endian 


S.128.A.B 


Store hexlet aligned big-endian 


S.128.L 


Store hexlet little-endian 


S.128.A.L 


Store hexlet aligned little-endian 


S.MUX.64.A.B 


Store multiplex octlet aligned big-endian 


S.MUX.64.A.L 


Store multiplex octlet aligned little-endian j 



Fig. 52A 



Selection 



number format 


op 


size 


alignment 


ordering 


byte 




8 






integer 




16 32 64 128 




L B 


integer aligned 




16 32 64 128 


A 


L B 


multiplex 


MUX 


64 


A 


L B 



Format 



op rd.rc.rb 
op(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I sTmINOR I rd j re | rb | op | 

8 6 6 6 6 
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Definition 



def Store(op,rd,rc,rb) as 
case op of 
S8: 

size «- 8 
S16L, S16AL, S16B, S16AB: 

size ^-16 
S32L t S32AL, S32B, S32AB: 

size «- 32 
S64L, S64AL, S64B, S64AB, 
SMUX64AB, SMUX64AL: 

size <- 64 
S128L, S128AL, S128B, S128AB: 

size <- 128 

endcase 
Isize <r- log(size) 
case op of 
S8: 

order <- undefined 
S16L, S32L, S64L, S128L, 
S16AL, S32AL, S64AL, S128AL, SMUX64ALI: 

order «- L 
S16B, S32B f S64B, S128B, 
S1 6AB, S32AB, S64AB, S1 28AB, SMUX64ABI: 

order <- B 

endcase 

c «- RegRead(rc t 64) 

b <- RegRead(rb, 64) 

VirtAddr <- c + (b 6 6-lsize..O II 0 ,size - 3 ) 

case op of 

S16AL, S32AL, S64AL, S1 28AL, 

S16AB, S32AB, S64AB, S128AB, 

SMUX64AB, SMUX64AL: 

if (C|size-4..0 ^ 0 ^ en 

raise AccessDisallowedByVtrtualAddress 

endif 

S16L.S32L.S64L, S128L, 
S16B, S32B, S64B, S128B: 
S8: 
endcase 



Fig. 52C 



d 4- RegRead(rd, 128) 
case op of 
S8, 

S16L,S16AL, S16B, S16AB, 
S32L, S32AL, S32B, S32AB, 
S64L, S64AL, S64B, S64AB, 
S128L, S128AL, S128B, S128AB: 

StoreMemory(c,VirtAddr t size,order,d S i 2 e.i..o) 
SMUX64AB, SMUX64AL: 

lock 

a <- LoadMemoryWfc.VirtAddr.size.order) 

m *- (di27..64 & d63..0) I (a & ~d63..0) 
StoreMemory(c,VirtAddr,size,order f rn) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 52C (cont) 



Operation c des 



S.1.8 


Store immediate byte 


S.I.16AB 


Store immediate double aligned big-endian 


S.I.16.B 


Store immediate, double big-endian 


S.I.16AL 


Store immediate double aligned little-endian 


S.I.16.L 


Store immediate double little-endian 


S.I.32.A.B 


Store immediate quadlet aligned big-endian 


S.I.32.B 


Store immediate quadlet big-endian 


S.I.32AL 


Store immediate quadlet aligned little-endian 


S.I.32.L 


Store immediate quadlet little-endian 


S.I.64AB 


Store immediate octlet aligned big-endian 


S.I.64.B 


Store immediate octlet big-endian 


S.I.64AL 


Store immediate octlet aligned little-endian 


S.I.64.L 


Store immediate octlet little-endian 


S.I.128AB 


Store immediate hexlet aligned big-endian 


S.I.128.B 


Store immediate hexlet big-endian j 


S.I.128AL 


Store immediate hexlet aligned little-endian 


S.I.128.L 


Store immediate hexlet little-endian 


S.MUXI.64AB 


Store multiplex immediate octlet aligned big-endian 


S.MUXI.64AL 


Store multiplex immediate octlet aligned little-endian 



Fig. 53A 



Selection 



number format ! 


op 


size 


alignment 


ordering 


byte 




8 






integer 




16 32 64 128 




L B 


integer aligned 




16 32 64 128 


A 


L B 


multiplex 


MUX 


64 


A 


L B 



Format 



S.op.l.size.align.order rd.rc.offset 
sopisizealignorder(rd,rc t offset) 

31 24 23 18 17 12 11 0 

| op | rd | rc I offset" 



6 6 12 

Fig. 53B 



Definition 



def Storelmmediatefop.rd.rc.offset) as 
case op of 
SI8: 

size <- 8 
SI16L, SI16AL, SI16B, SI16AB: 

size «-16 
SI32L, SI32AL, SI32B, SI32AB: 

size +- 32 

SI64L, SI64AL, SI64B, SI64AB, SMUXI64AB, SMUXI64AL: 

size <- 64 
SI128L, SI128AL, SI128B, SI128AB: 

size <- 128 

endcase 
Isize «- log(size) 
case op of 
SI8: 

order <- undefined 
SI16L, SI32L, SI64L, SI128L, 
SI16AL, SI32AL, SI64AL, SI128AL, SMUXI64AL: 

order <- L 
SI16B, SI32B, SI64B, SI128B, 
SI16AB, SI32AB, SI64AB, SI128AB, SMUXI64AB: 

order <- B 

endcase 

c <- RegRead(rc, 64) 

VirtAddr <- c + (offset^ ,size || offset || 0 lsize * 3 ) 

case op of 

SI16AL, SI32AL, SI64AL, SI128AL, 
SI16AB, SI32AB, SI64AB, SI128AB, 
SMUXI64AB, SMUXI64AL: 
if (cisize-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

endif 

SI16L, SI32L, SI64L, SI128L, 
SI16B, SI32B.SI64B, SI128B: 
SI8: 
endcase 



Fig. 53C 



d <- RegRead(rd, 128) 
case op of 
SI8. 

SI16L, SI16AL, SI16B, SI16AB, 
SI32L, SI32AL, SI32B, SI32AB, 
SI64L. SI64AL, SI64B, SI64AB, 
SI128L, SI128AL, SI128B, SI128AB: 

StoreMemory(c l VirtAddr t si2e,order,d S | ze -i..o) 
SMUXI64AB, SMUXI64AL: 

lock 

a ^- LoadMemoryWfc.VirtAddr.size.order) 

m <- (di27..64 & d 6 3..0) I (a & -d63..0) 
StoreMemory(c,VirtAddr f si2e,order f m) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 53C (cont) 
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